diff --git a/.alltests b/.alltests new file mode 100755 index 0000000000..75ccf9a527 --- /dev/null +++ b/.alltests @@ -0,0 +1,22 @@ +#!/bin/bash + +set -e + +TOP_DIR=$(dirname $(realpath "$0")) + +echo "==== Unit tests ====" +resetswift +$TOP_DIR/.unittests $@ + +echo "==== Func tests ====" +resetswift +startmain +$TOP_DIR/.functests $@ + +echo "==== Probe tests ====" +resetswift +$TOP_DIR/.probetests $@ + +echo "All tests runs fine" + +exit 0 diff --git a/.coveragerc b/.coveragerc index 5893dbe75f..6f8f341733 100644 --- a/.coveragerc +++ b/.coveragerc @@ -3,4 +3,5 @@ branch = True omit = /usr*,setup.py,*egg*,.venv/*,.tox/*,test/* [report] -ignore-errors = True +show_missing = True +ignore_errors = True diff --git a/.dockerignore b/.dockerignore new file mode 100644 index 0000000000..e8bdd7d5cc --- /dev/null +++ b/.dockerignore @@ -0,0 +1,11 @@ +.tox +api-ref +cover +doc/manpages +doc/s3api +doc/source +examples +releasenotes +.stestr +test +tools diff --git a/.functests b/.functests index 9797f58a1e..3d1af25b73 100755 --- a/.functests +++ b/.functests @@ -1,15 +1,15 @@ #!/bin/bash -SRC_DIR=$(dirname $0) +# How-To debug functional tests: +# SWIFT_TEST_IN_PROCESS=1 tox -e func -- --pdb test.functional.tests.TestFile.testCopy -cd ${SRC_DIR}/test/functional -nosetests --exe $@ -func1=$? -cd - +SRC_DIR=$(dirname $(realpath "$0")) -cd ${SRC_DIR}/test/functionalnosetests -nosetests --exe $@ -func2=$? -cd - +cd ${SRC_DIR} > /dev/null +export TESTS_DIR=${SRC_DIR}/test/functional +ARGS="run --concurrency 1 $@" +stestr $ARGS || stestr run --concurrency 1 --failing +rvalue=$? +cd - > /dev/null -exit $((func1 + func2)) +exit $rvalue diff --git a/.gitignore b/.gitignore index ae7e6fcc59..46ae0a33b4 100644 --- a/.gitignore +++ b/.gitignore @@ -1,10 +1,27 @@ *.py[co] *.sw? +*~ doc/build/* dist +build +cover ChangeLog .coverage -swift.egg-info +*.egg +*.egg-info +.eggs/* .DS_Store .tox -pycscope.* \ No newline at end of file +pycscope.* +.idea +MANIFEST + +.testrepository/* +.stestr/* +.noseids +subunit.log +test/probe/.noseids +RELEASENOTES.rst +releasenotes/notes/reno.cache +/tools/playbooks/**/*.retry +.vscode/* diff --git a/.gitreview b/.gitreview index d7c52c0593..529e7ec93d 100644 --- a/.gitreview +++ b/.gitreview @@ -1,4 +1,4 @@ [gerrit] -host=review.openstack.org +host=review.opendev.org port=29418 project=openstack/swift.git diff --git a/.mailmap b/.mailmap index c0d6e31d9a..adcdf007d9 100644 --- a/.mailmap +++ b/.mailmap @@ -2,6 +2,7 @@ Greg Holt gholt Greg Holt gholt Greg Holt gholt Greg Holt gholt +Greg Holt Greg Holt John Dickinson Michael Barton @@ -9,6 +10,7 @@ Michael Barton Michael Barton Mike Barton Clay Gerrard Clay Gerrard +Clay Gerrard Clay Gerrard clayg David Goetz David Goetz @@ -17,19 +19,133 @@ Anne Gentle annegentle Fujita Tomonori Greg Lange Greg Lange +Chmouel Boudjnah Gaurav B. Gangalwar gaurav@gluster.com <> Joe Arnold Kapil Thangavelu kapil.foss@gmail.com <> Samuel Merritt +Samuel Merritt Morita Kazutaka -Zhong Yue Luo lzyeval +Zhongyue Luo Russ Nelson Marcelo Martins Andrew Clay Shafer Soren Hansen +Soren Hansen Ye Jia Xu monsterxx03 Victor Rodionov Florian Hines Jay Payne Doug Weimer Li Riqiang lrqrun +Cory Wright +Julien Danjou +David Hadas +Yaguang Wang ywang19 +Liu Siqi dk647 +James E. Blair +James E. 
Blair +Kun Huang +Michael Shuler +Ilya Kharin +Dmitry Ukov Ukov Dmitry +Tom Fifield Tom Fifield +Sascha Peilicke Sascha Peilicke +Zhenguo Niu +Peter Portante +Christian Schwede +Christian Schwede +Constantine Peresypkin +Madhuri Kumari madhuri +Morgan Fainberg +Hua Zhang +Yummy Bian +Alistair Coles +Alistair Coles +Tong Li +Paul Luse +Yuan Zhou +Jola Mirecka +Ning Zhang +Mauro Stettler +Pawel Palucki +Guang Yee +Jing Liuqing +Lorcan Browne +Eohyung Lee +Harshit Chitalia +Richard Hawkins +Sarvesh Ranjan +Minwoo Bae Minwoo B +Jaivish Kothari +Michael Matur +Kazuhiro Miyahara +Alexandra Settle +Kenichiro Matsuda +Atsushi Sakai +Takashi Natsume +Nakagawa Masaaki nakagawamsa +Romain Le Disez Romain LE DISEZ +Romain Le Disez +Donagh McCabe +Donagh McCabe +Eamonn O'Toole +Gerry Drudy +Mark Seger +Timur Alperovich +Mehdi Abaakouk +Richard Hawkins +Ondrej Novy +Ondrej Novy +Peter Lisák +Peter Lisák Peter Lisák +Ke Liang +Daisuke Morita +Andreas Jaeger +Hugo Kuo +Gage Hugo +Oshrit Feder +Larry Rensing +Ben Keller +Chaozhe Chen +Brian Cline +Brian Cline +Dharmendra Kushwaha +Zhang Guoqing +Kato Tomoyuki +Liang Jingtao +Yu Yafei +Zheng Yao +Paul Dardeau +Cheng Li +Nandini Tata +Flavio Percoco +Tin Lam +Hisashi Osanai +Bryan Keller +Doug Hellmann +zhangdebo1987 zhangdebo +Thomas Goirand +Thiago da Silva +Kota Tsuyuzaki +Kota Tsuyuzaki +Kota Tsuyuzaki +Ehud Kaldor +Takashi Kajinami +Takashi Kajinami +Yuxin Wang Wang Yuxin +Gilles Biannic gillesbiannic +melissaml +Ashwin Nair indianwhocodes +Romain de Joux +Takashi Natsume +Pete Zaitcev +Mandell Degerness +Anish Kachinthaya +Daanish Khan +Chris Smart +Ashwin Nair +Chinemerem Chigbo Chinemerem +Chinemerem Chigbo +Tim Burke +Christian Ohanaja diff --git a/.manpages b/.manpages new file mode 100755 index 0000000000..69fcfc74d5 --- /dev/null +++ b/.manpages @@ -0,0 +1,18 @@ +#!/bin/sh + +RET=0 +for MAN in doc/manpages/* ; do + OUTPUT=$(LC_ALL=en_US.UTF-8 MANROFFSEQ='' MANWIDTH=80 man --warnings -E UTF-8 -l \ + -Tutf8 -Z "$MAN" 2>&1 >/dev/null) + if [ -n "$OUTPUT" ] ; then + RET=1 + echo "$MAN:" + echo "$OUTPUT" + fi +done + +if [ "$RET" -eq "0" ] ; then + echo "All manpages are fine" +fi + +exit "$RET" diff --git a/.probetests b/.probetests index 5d9f69915e..9a7aafda63 100755 --- a/.probetests +++ b/.probetests @@ -1,7 +1,9 @@ #!/bin/bash -cd $(dirname $0)/test/probe -nosetests --exe +SRC_DIR=$(dirname $(realpath "$0")) + +cd ${SRC_DIR}/test/probe +pytest $@ rvalue=$? cd - diff --git a/.stestr.conf b/.stestr.conf new file mode 100644 index 0000000000..3e674fb026 --- /dev/null +++ b/.stestr.conf @@ -0,0 +1,2 @@ +[DEFAULT] +test_path=./test/functional diff --git a/.unittests b/.unittests index 6fc2eb1ed9..9873b17974 100755 --- a/.unittests +++ b/.unittests @@ -1,7 +1,9 @@ #!/bin/bash -cd $(dirname $0)/test/unit -nosetests --exe --with-coverage --cover-package swift --cover-erase $@ +TOP_DIR=$(dirname $(realpath "$0")) + +cd $TOP_DIR/test/unit +pytest --cov-report=html:"$TOP_DIR"/cover $@ rvalue=$? rm -f .coverage cd - diff --git a/.zuul.yaml b/.zuul.yaml new file mode 100644 index 0000000000..c580994d2f --- /dev/null +++ b/.zuul.yaml @@ -0,0 +1,773 @@ +- job: + name: swift-tox-base + parent: openstack-tox-py310 + nodeset: ubuntu-jammy + description: | + Base job for swift-tox jobs. + + It sets TMPDIR to an XFS mount point created via + tools/test-setup.sh. 
+ timeout: 5400 + vars: + tox_environment: + TMPDIR: '{{ ansible_env.HOME }}/xfstmp' + COLUMNS: 240 + +- job: + name: swift-tox-py37 + parent: swift-tox-base + description: | + Run unit-tests for swift under cPython version 3.7. + + Uses tox with the ``py37`` environment. + It sets TMPDIR to an XFS mount point created via + tools/test-setup.sh. + vars: + tox_envlist: py37 + python_use_pyenv: True + python_version: 3.7 + post-run: tools/playbooks/common/cover-post.yaml + +- job: + name: swift-tox-py38 + parent: swift-tox-base + nodeset: ubuntu-focal + description: | + Run unit-tests for swift under cPython version 3.8. + + Uses tox with the ``py38`` environment. + It sets TMPDIR to an XFS mount point created via + tools/test-setup.sh. + vars: + tox_envlist: py38 + python_version: 3.8 + post-run: tools/playbooks/common/cover-post.yaml + +- job: + name: swift-tox-py38-arm64 + parent: swift-tox-py38 + nodeset: ubuntu-focal-arm64 + description: | + Run unit tests for an OpenStack Python project under cPython + version 3.8 on top of arm64 architecture. + timeout: 10800 + +- job: + name: swift-tox-py312-arm64 + parent: swift-tox-py312 + nodeset: debian-bookworm-arm64 + description: | + Run unit tests for an OpenStack Python project under cPython + version 3.12 on top of arm64 architecture. + timeout: 10800 + +- job: + name: swift-tox-py39 + parent: swift-tox-base + nodeset: ubuntu-focal + description: | + Run unit-tests for swift under cPython version 3.9. + + Uses tox with the ``py39`` environment. + It sets TMPDIR to an XFS mount point created via + tools/test-setup.sh. + vars: + tox_envlist: py39 + python_version: 3.9 + post-run: tools/playbooks/common/cover-post.yaml + +- job: + name: swift-tox-py310 + parent: swift-tox-base + nodeset: ubuntu-jammy + description: | + Run unit-tests for swift under cPython version 3.10. + + Uses tox with the ``py310`` environment. + It sets TMPDIR to an XFS mount point created via + tools/test-setup.sh. + vars: + tox_envlist: py310 + python_version: '3.10' + post-run: tools/playbooks/common/cover-post.yaml + +- job: + name: swift-tox-py311 + parent: swift-tox-base + nodeset: ubuntu-jammy + description: | + Run unit-tests for swift under cPython version 3.11. + + Uses tox with the ``py311`` environment. + It sets TMPDIR to an XFS mount point created via + tools/test-setup.sh. + vars: + tox_envlist: py311 + python_version: '3.11' + +- job: + name: swift-tox-py312 + parent: swift-tox-base + nodeset: debian-bookworm + description: | + Run unit-tests for swift under cPython version 3.12. + + Uses tox with the ``py312`` environment. + It sets TMPDIR to an XFS mount point created via + tools/test-setup.sh. + vars: + tox_envlist: py312 + python_use_pyenv: True + python_version: '3.12' + +- job: + name: swift-tox-py313 + parent: swift-tox-base + nodeset: ubuntu-noble + description: | + Run unit-tests for swift under cPython version 3.13. + + Uses tox with the ``py313`` environment. + It sets TMPDIR to an XFS mount point created via + tools/test-setup.sh. + vars: + tox_envlist: py313 + python_use_pyenv: True + python_version: '3.13' + +- job: + name: swift-tox-func-py312 + parent: swift-tox-base + nodeset: ubuntu-noble + description: | + Run functional tests for swift under cPython version 3.12. + + Uses tox with the ``func-py3`` environment. + It sets TMPDIR to an XFS mount point created via + tools/test-setup.sh. 
+ vars: + tox_envlist: func + python_version: 3.12 + +- job: + name: swift-tox-func-py39-centos-9-stream + parent: swift-tox-func-py312 + nodeset: centos-9-stream + vars: + python_version: 3.9 + +- job: + name: swift-tox-func-encryption-py39-centos-9-stream + parent: swift-tox-func-py39-centos-9-stream + vars: + tox_envlist: func-encryption + +- job: + name: swift-tox-func-ec-py39-centos-9-stream + parent: swift-tox-func-py39-centos-9-stream + vars: + tox_envlist: func-ec + +- job: + name: swift-tox-func-encryption-py312 + parent: swift-tox-func-py312 + description: | + Run functional tests for swift under cPython version 3.12. + + Uses tox with the ``func-encryption-py3`` environment. + It sets TMPDIR to an XFS mount point created via + tools/test-setup.sh. + vars: + tox_envlist: func-encryption + +- job: + name: swift-tox-func-encryption-py312-arm64 + parent: swift-tox-func-encryption-py312 + nodeset: ubuntu-noble-arm64 + description: | + Run functional tests for swift under cPython version 3.12 + on top of arm64 architecture. + + Uses tox with the ``func-encryption-py3`` environment. + It sets TMPDIR to an XFS mount point created via + tools/test-setup.sh. + timeout: 10800 + +- job: + name: swift-tox-func-py312-arm64 + parent: swift-tox-func-py312 + nodeset: ubuntu-noble-arm64 + description: | + Run functional tests for swift under cPython version 3.12 + on top of arm64 architecture. + + Uses tox with the ``func-py3`` environment. + It sets TMPDIR to an XFS mount point created via + tools/test-setup.sh. + timeout: 10800 + +- job: + name: swift-tox-func-ec-py312 + parent: swift-tox-func-py312 + description: | + Run functional tests for swift under cPython version 3.12. + + Uses tox with the ``func-ec-py3`` environment. + It sets TMPDIR to an XFS mount point created via + tools/test-setup.sh. + vars: + tox_envlist: func-ec + +- job: + name: swift-dsvm-functional + parent: devstack-minimal + description: | + Setup a Swift/Keystone environment and run Swift's func tests. + required-projects: + - opendev.org/openstack/requirements + - opendev.org/openstack/swift + - opendev.org/openstack/keystone + timeout: 5400 + vars: + tox_environment: + COLUMNS: 240 + tox_constraints_file: '{{ ansible_user_dir }}/src/opendev.org/openstack/requirements/upper-constraints.txt' + # This tox env get run twice; once for Keystone and once for tempauth + tox_envlist: func,s3api + devstack_localrc: + SWIFT_HASH: changeme + # We don't need multiple replicas to run purely functional tests. + # In fact, devstack special cases some things when there's only + # one replica. + SWIFT_REPLICAS: 1 + # One replica => no need for replicators, etc. 
+ SWIFT_START_ALL_SERVICES: False + devstack_services: + keystone: true + swift: true + s3api: true + zuul_work_dir: src/opendev.org/openstack/swift + pre-run: tools/playbooks/dsvm/pre.yaml + run: tools/playbooks/dsvm/run.yaml + post-run: tools/playbooks/dsvm/post.yaml + +- job: + name: swift-dsvm-functional-ipv6 + parent: swift-dsvm-functional + vars: + devstack_localrc: + SERVICE_IP_VERSION: 6 + SERVICE_HOST: "" + +- job: + name: swift-tox-func-ceph-s3tests-tempauth + parent: unittests + voting: false + nodeset: centos-9-stream + description: | + Setup a SAIO dev environment and run ceph-s3tests + timeout: 5400 + vars: + tox_environment: + COLUMNS: 240 + s3_acl: yes + pre-run: + - tools/playbooks/common/install_dependencies.yaml + - tools/playbooks/saio_single_node_setup/setup_saio.yaml + - tools/playbooks/saio_single_node_setup/add_s3api.yaml + - tools/playbooks/saio_single_node_setup/make_rings.yaml + - tools/playbooks/common/restart_swift.yaml + run: tools/playbooks/ceph-s3tests/run.yaml + post-run: + - tools/playbooks/probetests/post.yaml + - tools/playbooks/ceph-s3tests/post.yaml + +- job: + name: swift-tox-func-s3api-compat-tests-tempauth + parent: unittests + nodeset: centos-9-stream + description: | + Setup a SAIO dev environment and run our s3api test suite + timeout: 1800 + vars: + tox_environment: + COLUMNS: 240 + s3_acl: yes + pre-run: + - tools/playbooks/common/install_dependencies.yaml + - tools/playbooks/saio_single_node_setup/setup_saio.yaml + - tools/playbooks/saio_single_node_setup/add_s3api.yaml + - tools/playbooks/saio_single_node_setup/make_rings.yaml + - tools/playbooks/common/restart_swift.yaml + run: tools/playbooks/s3api-tests/run.yaml + post-run: + - tools/playbooks/probetests/post.yaml + +- job: + name: swift-probetests-centos-9-stream + parent: unittests + nodeset: centos-9-stream + description: | + Setup a SAIO dev environment and run Swift's probe tests + under Python 3. + timeout: 7200 + vars: + tox_environment: + COLUMNS: 240 + s3_acl: no + pre-run: + - tools/playbooks/common/install_dependencies.yaml + - tools/playbooks/saio_single_node_setup/setup_saio.yaml + - tools/playbooks/saio_single_node_setup/make_rings.yaml + - tools/playbooks/saio_single_node_setup/add_s3api.yaml + run: tools/playbooks/probetests/run.yaml + post-run: tools/playbooks/probetests/post.yaml + +- job: + name: swift-probetests-centos-9-stream-arm64 + parent: swift-probetests-centos-9-stream + nodeset: + nodes: + - name: swift-centos-9-stream-arm64 + label: centos-9-stream-arm64 + description: | + Setup a SAIO dev environment and run Swift's probe tests + under Python 3 on top of arm64 architecture. 
+ timeout: 10800 + +- job: + name: swift-func-cors + parent: swift-probetests-centos-9-stream + description: | + Setup a SAIO dev environment and run Swift's CORS functional tests + timeout: 1200 + pre-run: + - tools/playbooks/cors/install_selenium.yaml + run: tools/playbooks/cors/run.yaml + post-run: tools/playbooks/cors/post.yaml + +- nodeset: + name: swift-five-nodes-centos-9 + nodes: + - name: test-runner1 + label: centos-9-stream + - name: proxy1 + label: centos-9-stream + - name: account1 + label: centos-9-stream + - name: container1 + label: centos-9-stream + - name: object1 + label: centos-9-stream + groups: + - name: test-runner + nodes: + - test-runner1 + - name: swift-cluster + nodes: + - proxy1 + - account1 + - container1 + - object1 + - name: proxy + nodes: + - proxy1 + - name: account + nodes: + - account1 + - name: container + nodes: + - container1 + - name: object + nodes: + - object1 + - name: storage + nodes: + - account1 + - container1 + - object1 + +- job: + name: swift-multinode-rolling-upgrade + parent: multinode + nodeset: swift-five-nodes-centos-9 + description: | + Build a 4 node swift cluster and run functional tests + timeout: 5400 + vars: + tox_envlist: func + pre-run: + - tools/playbooks/multinode_setup/pre.yaml + - tools/playbooks/common/install_dependencies.yaml + - tools/playbooks/multinode_setup/configure_loopback.yaml + - tools/playbooks/multinode_setup/common_config.yaml + - tools/playbooks/multinode_setup/make_rings.yaml + run: tools/playbooks/multinode_setup/run.yaml + post-run: tools/playbooks/probetests/post.yaml + +- job: + name: swift-multinode-rolling-upgrade-wallaby + parent: swift-multinode-rolling-upgrade + vars: + previous_swift_version: wallaby-eom + tox_envlist: func-py3 + +- job: + name: swift-multinode-rolling-upgrade-xena + parent: swift-multinode-rolling-upgrade + vars: + previous_swift_version: xena-eom + tox_envlist: func-py3 + +- job: + name: swift-multinode-rolling-upgrade-yoga + parent: swift-multinode-rolling-upgrade + vars: + previous_swift_version: yoga-eom + tox_envlist: func-py3 + +- job: + name: swift-multinode-rolling-upgrade-zed + parent: swift-multinode-rolling-upgrade + vars: + previous_swift_version: zed-eom + tox_envlist: func-py3 + +- job: + name: swift-multinode-rolling-upgrade-antelope + parent: swift-multinode-rolling-upgrade + vars: + previous_swift_version: 2023.1-eom + tox_envlist: func-py3 + +- job: + name: swift-multinode-rolling-upgrade-bobcat + parent: swift-multinode-rolling-upgrade + vars: + previous_swift_version: 2023.2-eol + tox_envlist: func-py3 + +- job: + name: swift-multinode-rolling-upgrade-caracal + parent: swift-multinode-rolling-upgrade + vars: + previous_swift_version: 2024.1-eom + tox_envlist: func-py3 + +- job: + name: swift-multinode-rolling-upgrade-dalmatian + parent: swift-multinode-rolling-upgrade + vars: + previous_swift_version: origin/stable/2024.2 + tox_envlist: func-py3 + +- job: + name: swift-multinode-rolling-upgrade-epoxy + parent: swift-multinode-rolling-upgrade + vars: + previous_swift_version: origin/stable/2025.1 + +- job: + name: swift-multinode-rolling-upgrade-flamingo + parent: swift-multinode-rolling-upgrade + vars: + previous_swift_version: origin/stable/2025.2 + +- job: + name: swift-multinode-rolling-upgrade-master + parent: swift-multinode-rolling-upgrade + vars: + previous_swift_version: origin/master + +- job: + name: swift-tox-lower-constraints + parent: openstack-tox-lower-constraints + vars: + python_use_pyenv: True + python_version: 3.7 + tox_environment: + TMPDIR: 
'{{ ansible_env.HOME }}/xfstmp' + +# Image building jobs +- secret: + name: swift-dockerhub-2026 + data: + username: screamingfrenzy + password: !encrypted/pkcs1-oaep + # Updated via `zuul-client --zuul-url https://zuul.opendev.org encrypt --tenant openstack --project openstack/swift --secret-name swift-dockerhub-2026 --infile /tmp/secret --field-name password` + # Be careful not to include any trailing newlines in the secret file! It should contain *exactly* the password: no more, no less. + # Note that we've seen issues with some special characters causing issues in the ansible plumbing; new passwords should probably avoid using double quotes ("), single quotes ('), and dollar signs ($). + - R0AnQRtM0ObjNvqQgc/E9KH1o4CeNwzPB4jUc0ji6BHjHL4zXPi1P29L1BZgc+MlG/Ps/ + SLHTQPyUJpmrlVyFKBhvQcs+0qpeF56TqHYN1sW0j7IHHRLvfRHzKO5oarWeVWJi34PRx + cGdXIT3oYvwWq8D6Lr/XgBOH4eotpfxxR7IYUM7Ti07MHBiVtzZHMvV0/I/YzkaK1oZ2C + n5AYmII/h57YtgTpOOM5dHL3Q6qOaQ4s9nkvyia5R7aRjZW+L1MqP9UjpslGF5AXkAoI5 + xafRwXdCC7L7cwktmvWUgH8mLjoBhVMZR9wn8IqrsrwUI0qs1QvI6N3mC+lIFTdFfDyfx + bJy8umeIkdZ5AmuDEstpb/PORW4q+JfRPFtxtBPxj7E5GrYC5AaBId+8/nHy0vQmcYfON + RT0/lQ+xTlfEkSu2PkIoQsXG1Xxdmeb+j/dG/eTlxQVCyza1DITzOfCLwwrdvHxJvez8M + CvUoS5q0+R+9NRvM1Pc+qTJM7GIe2MNwCn1TcClJd0tspcm2I+uxf/LhX/53qGzs94YrO + +ccqWd4W1ejajbIhCI9VmxhudxJfxxly17g5keJkxDH+akKg4vbg78agiS3NhIkFIiKOn + zQGlA92Ufvd7VnMXJvH+wzK+9RV822i0f/Vfz1aE53Xq1r0bnUPtYFiNlpgrn0= + +- job: + name: swift-build-image + parent: opendev-build-docker-image + voting: false + description: Build SAIO docker images. + vars: &swift_image_vars + docker_images: + - context: . + repository: openstackswift/saio + tags: + - latest + - py3 + +- job: + name: swift-upload-image + parent: opendev-upload-docker-image + voting: false + description: Build SAIO docker images and upload to Docker Hub. + secrets: + name: docker_credentials + secret: swift-dockerhub-2026 + pass-to-parent: true + vars: *swift_image_vars + +- job: + name: swift-promote-image + parent: opendev-promote-docker-image + voting: false + description: Promote previously uploaded Docker images. + secrets: + name: docker_credentials + secret: swift-dockerhub-2026 + pass-to-parent: true + vars: *swift_image_vars + +- job: + name: swift-tox-func-py39-centos-9-stream-fips + parent: swift-tox-func-py39-centos-9-stream + voting: false + description: | + Functional testing on a FIPS enabled Centos 9 system + vars: + nslookup_target: 'opendev.org' + enable_fips: true + +- job: + name: swift-tox-func-encryption-py39-centos-9-stream-fips + parent: swift-tox-func-encryption-py39-centos-9-stream + voting: false + description: | + Functional encryption testing on a FIPS enabled + Centos 9 system + vars: + nslookup_target: 'opendev.org' + enable_fips: true + +- job: + name: swift-tox-func-ec-py39-centos-9-stream-fips + parent: swift-tox-func-ec-py39-centos-9-stream + voting: false + description: | + Functional EC testing on a FIPS enabled Centos 9 system + vars: + nslookup_target: 'opendev.org' + enable_fips: true + +# TODO(gmann): As per the 2025.1 testing runtime, we need to run at least +# one job on jammy. This job can be removed as per the future testing +# runtime (whenever we start testing Ubuntu 26.04 as default version). 
+- job: + name: tempest-integrated-object-storage-ubuntu-jammy + description: This is integrated object-storage job testing on Ubuntu jammy(22.04) + parent: tempest-integrated-object-storage + nodeset: openstack-single-node-jammy + +- project-template: + name: swift-jobs-arm64 + description: | + Runs tests for an OpenStack Python project under the CPython + version 3 releases designated for testing on top of ARM64 architecture. + check-arm64: + jobs: + - swift-tox-py312-arm64 + experimental: + jobs: + - swift-tox-py38-arm64 + - swift-tox-func-encryption-py312-arm64 + - swift-tox-func-py312-arm64 + +- project: + templates: + - publish-openstack-docs-pti + - periodic-stable-jobs + - check-requirements + - release-notes-jobs-python3 + - integrated-gate-object-storage + - swift-jobs-arm64 + check: + jobs: + - swift-tox-func-py39-centos-9-stream-fips: + irrelevant-files: &functest-irrelevant-files + - ^(api-ref|doc|releasenotes)/.*$ + - ^test/(cors|probe|s3api)/.*$ + - ^(.gitreview|.mailmap|AUTHORS|CHANGELOG|.*\.rst)$ + - swift-tox-func-encryption-py39-centos-9-stream-fips: + irrelevant-files: *functest-irrelevant-files + - swift-tox-func-ec-py39-centos-9-stream-fips: + irrelevant-files: *functest-irrelevant-files + - swift-build-image: + irrelevant-files: &docker-irrelevant-files + - ^(api-ref|doc|releasenotes)/.*$ + - ^test/(functional|probe)/.*$ + + # Unit tests + - swift-tox-py37: + irrelevant-files: &unittest-irrelevant-files + - ^(api-ref|doc|releasenotes)/.*$ + - ^test/(cors|functional|probe|s3api)/.*$ + - swift-tox-py39: + irrelevant-files: *unittest-irrelevant-files + - swift-tox-py312: + irrelevant-files: *unittest-irrelevant-files + - swift-tox-py313: + irrelevant-files: *unittest-irrelevant-files + + # Functional tests + - swift-tox-func-py312: + irrelevant-files: *functest-irrelevant-files + - swift-tox-func-encryption-py312: + irrelevant-files: *functest-irrelevant-files + - swift-tox-func-ec-py312: + irrelevant-files: *functest-irrelevant-files + + # Other tests + - swift-func-cors: + irrelevant-files: + - ^(api-ref|releasenotes)/.*$ + # Keep doc/saio -- we use those sample configs in the saio playbooks + - ^doc/(requirements.txt|(manpages|s3api|source)/.*)$ + - ^test/(unit|functional|probe|s3api)/.*$ + - ^(.gitreview|.mailmap|AUTHORS|CHANGELOG)$ + - swift-tox-func-ceph-s3tests-tempauth: + irrelevant-files: + - ^(api-ref|releasenotes)/.*$ + # Keep doc/saio -- we use those sample configs in the saio playbooks + # Also keep doc/s3api -- it holds known failures for these tests + - ^doc/(requirements.txt|(manpages|source)/.*)$ + - ^test/.*$ + - ^(.gitreview|.mailmap|AUTHORS|CHANGELOG|.*\.rst)$ + - swift-tox-func-s3api-compat-tests-tempauth: + irrelevant-files: + - ^(api-ref|releasenotes)/.*$ + # Keep doc/saio -- we use those sample configs in the saio playbooks + - ^doc/(requirements.txt|(manpages|s3api|source)/.*)$ + - ^test/(cors|unit|functional|probe)/.*$ + - ^(.gitreview|.mailmap|AUTHORS|CHANGELOG|.*\.rst)$ + - swift-probetests-centos-9-stream: + irrelevant-files: &probetest-irrelevant-files + - ^(api-ref|releasenotes)/.*$ + # Keep doc/saio -- we use those sample configs in the saio playbooks + - ^doc/(requirements.txt|(manpages|s3api|source)/.*)$ + - ^test/(cors|unit|functional|s3api)/.*$ + - ^(.gitreview|.mailmap|AUTHORS|CHANGELOG|.*\.rst)$ + - swift-dsvm-functional: + irrelevant-files: *functest-irrelevant-files + - swift-dsvm-functional-ipv6: + irrelevant-files: *functest-irrelevant-files + - swift-tox-lower-constraints: + irrelevant-files: *unittest-irrelevant-files + - 
openstack-tox-pep8: + irrelevant-files: &pep8-irrelevant-files + - ^(api-ref|etc|examples|releasenotes)/.*$ + # Keep doc/manpages -- we want to syntax check them + - ^doc/(requirements.txt|(saio|s3api|source)/.*)$ + - swift-multinode-rolling-upgrade: + irrelevant-files: *functest-irrelevant-files + - tempest-integrated-object-storage: + irrelevant-files: &tempest-irrelevant-files + - ^(api-ref|doc|releasenotes)/.*$ + - ^test/.*$ + - ^(.gitreview|.mailmap|AUTHORS|CHANGELOG|.*\.rst)$ + - tempest-integrated-object-storage-ubuntu-jammy: + irrelevant-files: *tempest-irrelevant-files + - tempest-ipv6-only: + irrelevant-files: *tempest-irrelevant-files + - openstacksdk-functional-devstack: + irrelevant-files: *tempest-irrelevant-files + - grenade: + irrelevant-files: *tempest-irrelevant-files + - grenade-skip-level: + irrelevant-files: *tempest-irrelevant-files + - grenade-skip-level-always: + irrelevant-files: *tempest-irrelevant-files + gate: + jobs: + # For gate jobs, err towards running more jobs (so, generally avoid + # using irrelevant-files). Exceptions should mainly be made for + # long-running jobs, like probetests or (once they move to + # in-tree definitions) dsvm jobs. + - swift-upload-image: + irrelevant-files: *docker-irrelevant-files + - swift-tox-py37 + - swift-tox-py39 + - swift-tox-py312 + - swift-tox-py313 + - swift-tox-func-py312 + - swift-tox-func-encryption-py312 + - swift-tox-func-ec-py312 + - swift-func-cors + - swift-tox-func-s3api-compat-tests-tempauth + - swift-probetests-centos-9-stream: + irrelevant-files: *probetest-irrelevant-files + - swift-dsvm-functional: + irrelevant-files: *functest-irrelevant-files + - swift-dsvm-functional-ipv6: + irrelevant-files: *functest-irrelevant-files + - swift-tox-lower-constraints: + irrelevant-files: *unittest-irrelevant-files + - openstack-tox-pep8: + irrelevant-files: *pep8-irrelevant-files + - swift-multinode-rolling-upgrade: + irrelevant-files: *functest-irrelevant-files + - tempest-integrated-object-storage: + irrelevant-files: *tempest-irrelevant-files + - tempest-integrated-object-storage-ubuntu-jammy: + irrelevant-files: *tempest-irrelevant-files + - tempest-ipv6-only: + irrelevant-files: *tempest-irrelevant-files + - openstacksdk-functional-devstack: + irrelevant-files: *tempest-irrelevant-files + - grenade: + irrelevant-files: *tempest-irrelevant-files + - grenade-skip-level: + irrelevant-files: *tempest-irrelevant-files + - grenade-skip-level-always: + irrelevant-files: *tempest-irrelevant-files + experimental: + jobs: + - swift-tox-py38 + - swift-tox-py310 + - swift-tox-py311 + - swift-tox-func-py39-centos-9-stream + - swift-tox-func-encryption-py39-centos-9-stream + - swift-tox-func-ec-py39-centos-9-stream + - swift-multinode-rolling-upgrade-wallaby + - swift-multinode-rolling-upgrade-xena + - swift-multinode-rolling-upgrade-yoga + - swift-multinode-rolling-upgrade-zed + - swift-multinode-rolling-upgrade-antelope + - swift-multinode-rolling-upgrade-bobcat + - swift-multinode-rolling-upgrade-caracal + - swift-multinode-rolling-upgrade-dalmatian + - swift-multinode-rolling-upgrade-epoxy + - swift-multinode-rolling-upgrade-flamingo + - swift-multinode-rolling-upgrade-master: + branches: master + + post: + jobs: + - publish-openstack-python-branch-tarball + promote: + jobs: + - swift-promote-image diff --git a/AUTHORS b/AUTHORS index e123d379a9..1b3f4faf28 100644 --- a/AUTHORS +++ b/AUTHORS @@ -1,7 +1,7 @@ Maintainer ---------- -OpenStack, LLC. 
-IRC: #openstack on irc.freenode.net +OpenStack Foundation +IRC: #openstack on irc.oftc.net Original Authors ---------------- @@ -13,82 +13,494 @@ Jay Payne (letterj@gmail.com) Will Reese (wreese@gmail.com) Chuck Thier (cthier@gmail.com) +Core Emeritus +------------- +Chmouel Boudjnah (chmouel@enovance.com) +Florian Hines (syn@ronin.io) +Greg Holt (gholt@rackspace.com) +Paul Luse (paul.e.luse@intel.com) +Donagh McCabe (donagh.mccabe@gmail.com) +Hisashi Osanai (osanai.hisashi@gmail.com) +Jay Payne (letterj@gmail.com) +Peter Portante (peter.portante@redhat.com) +Will Reese (wreese@gmail.com) +Chuck Thier (cthier@gmail.com) +Darrell Bishop (darrell@swiftstack.com) +David Goetz (david.goetz@rackspace.com) +Greg Lange (greglange@gmail.com) +Janie Richling (jrichli@us.ibm.com) +Michael Barton (mike@weirdlooking.com) +Mahati Chamarthy (mahati.chamarthy@gmail.com) +Samuel Merritt (smerritt@nvidia.com) +Romain Le Disez (romain.ledisez@ovh.net) +Pete Zaitcev (zaitcev@yahoo.com) + Contributors ------------ -Jesse Andrews (anotherjesse@gmail.com) -Joe Arnold (joe@swiftstack.com) -Ionuț Arțăriși (iartarisi@suse.cz) -Darrell Bishop (darrell@swiftstack.com) -James E. Blair (james.blair@rackspace.com) -Chmouel Boudjnah (chmouel@chmouel.com) -Clark Boylan (clark.boylan@gmail.com) -Russell Bryant (rbryant@redhat.com) -Devin Carlen (devin.carlen@gmail.com) -Thierry Carrez (thierry@openstack.org) -François Charlier (francois.charlier@enovance.com) -Ray Chen (oldsharp@163.com) -Brian Cline (bcline@softlayer.com) -Julien Danjou (julien.danjou@enovance.com) -Dan Dillinger (dan.dillinger@sonian.net) -Tom Fifield (fifieldt@unimelb.edu.au) -Gaurav B. Gangalwar (gaurav@gluster.com) +Aaron Rosen (arosen@nicira.com) +Ade Lee (alee@redhat.com) +Adrian Smith (adrian_f_smith@dell.com) +Adrien Pensart (adrien.pensart@corp.ovh.com) +afariasa (afariasa@redhat.com) +Akihiro Motoki (amotoki@gmail.com) +Akihito Takai (takaiak@nttdata.co.jp) +Alex Gaynor (alex.gaynor@gmail.com) +Alex Holden (alex@alexjonasholden.com) +Alex Pecoraro (alex.pecoraro@emc.com) +Alex Szarka (szarka@inf.u-szeged.hu) +Alex Yang (alex890714@gmail.com) +Alexander Fadeev (fadeevab.com@gmail.com) +Alexandra Settle (asettle@suse.com) +Alexandre Lécuyer (alexandre.lecuyer@corp.ovh.com) +Alfredo Moralejo (amoralej@redhat.com) +Alistair Coles (alistairncoles@gmail.com) +Andreas Jaeger (aj@suse.de) +Andrew Clay Shafer (acs@parvuscaptus.com) +Andrew Hale (andy@wwwdata.eu) +Andrew Welleck (awellec@us.ibm.com) +Andy McCrae (andy.mccrae@gmail.com) +Anh Tran (anhtt@vn.fujitsu.com) +Anish Kachinthaya (anishk23733@gmail.com) +Ankur Gupta (ankur.gupta@intel.com) Anne Gentle (anne@openstack.org) +aolivo (aolivo@blizzard.com) +Arnaud JOST (arnaud.jost@ovh.net) +arzhna (arzhna@gmail.com) +Ashwin Nair (nairashwin952013@gmail.com) +Atsushi Sakai (sakaia@jp.fujitsu.com) +Aymeric Ducroquetz (aymeric.ducroquetz@ovhcloud.com) +Azhagu Selvan SP (tamizhgeek@gmail.com) +Azmain Adib (adib1905@gmail.com) +baiwenteng (baiwenteng@inspur.com) +Ben Keller (bjkeller@us.ibm.com) +Ben Martin (blmartin@us.ibm.com) +bhavani.cr (bhavani.r@nectechnologies.in) +Bill Huber (wbhuber@us.ibm.com) +Bob Ball (bob.ball@citrix.com) +Brent Roskos (broskos@internap.com) +Brian Cline (bcline@softlayer.com) +Brian Curtin (brian.curtin@rackspace.com) +Brian D. Burns (iosctr@gmail.com) +Brian K. 
Jones (bkjones@gmail.com) +Brian Ober (bober@us.ibm.com) +Brian Reitz (brian.reitz@oracle.com) +Bryan Keller (kellerbr@us.ibm.com) +Béla Vancsics (vancsics@inf.u-szeged.hu) +Caleb Tennis (caleb.tennis@gmail.com) +Callum Dickinson (callum.dickinson@catalystcloud.nz) +Cao Xuan Hoang (hoangcx@vn.fujitsu.com) +Carlos Cavanna (ccavanna@ca.ibm.com) +Catherine Northcott (catherine@northcott.nz) +Cedric Dos Santos (cedric.dos.sant@gmail.com) +Changbin Liu (changbin.liu@gmail.com) +ChangBo Guo(gcb) (eric.guo@easystack.cn) +Chaozhe Chen (chaozhe.chen@easystack.cn) +Charles Hsu (charles0126@gmail.com) +chenaidong1 (chen.aidong@zte.com.cn) +cheng (li.chenga@h3c.com) +Cheng Li (shcli@cn.ibm.com) +chengebj5238 (chengebj@inspur.com) +chenxiangui (chenxiangui@inspur.com) +Chetan Mishra (chetan.s115@gmail.com) +Chinemerem Chigbo (chinemeremchigbo@Outlook.com) +Chmouel Boudjnah (chmouel@enovance.com) +Chris Smart (distroguy@gmail.com) +Chris Wedgwood (cw@f00f.org) +Christian Berendt (berendt@b1-systems.de) +Christian Hugo (hugo.christian@web.de) +Christian Ohanaja (christianohanaja431@gmail.com) +Christian Schwede (cschwede@redhat.com) +Christopher Bartz (bartz@dkrz.de) +Christopher MacGown (chris@pistoncloud.com) +Chuck Short (chuck.short@canonical.com) +Clark Boylan (clark.boylan@gmail.com) Clay Gerrard (clay.gerrard@gmail.com) -Mark Gius (launchpad@markgius.com) +Clément Contini (ccontini@cloudops.com) +Colin Nicholson (colin.nicholson@iomart.com) +Colleen Murphy (colleen.murphy@suse.com) +Conrad Weidenkeller (conrad.weidenkeller@rackspace.com) +Constantine Peresypkin (constantine.peresypk@rackspace.com) +Corey Bryant (corey.bryant@canonical.com) +Cory Wright (cory.wright@rackspace.com) +Cristian A Sanchez (cristian.a.sanchez@intel.com) +CY Chiang (cychiang@cht.com.tw) +Cyril Roelandt (cyril@redhat.com) +Daanish Khan (daanish1337@gmail.com) +Dae S. Kim (dae@velatum.com) +Daisuke Morita (morita.daisuke@ntti3.com) +Dan Dillinger (dan.dillinger@sonian.net) +Dan Hersam (dan.hersam@hp.com) +Dan Prince (dprince@redhat.com) +dangming (dangming@unitedstack.com) +Daniele Pizzolli (dpizzolli@fbk.eu) +Daniele Valeriani (daniele@dvaleriani.net) +Darrell Bishop (darrell@swiftstack.com) +Darryl Tam (dtam@swiftstack.com) David Goetz (david.goetz@rackspace.com) -Jonathan Gonzalez V (jonathan.abdiel@gmail.com) -David Hadas (david.hadas@gmail.com) -Soren Hansen (soren@linux2go.dk) -Doug Hellmann (doug.hellmann@dreamhost.com) +David Hadas (davidh@il.ibm.com) +David Liu (david.liu@cn.ibm.com) +David Moreau Simard (dmsimard@iweb.com) +David Rabel (rabel@b1-systems.de) +Dean Troyer (dtroyer@gmail.com) +Denis V. Meltsaykin (dmeltsaykin@mirantis.com) Derek Higgins (derekh@redhat.com) +Devin Carlen (devin.carlen@gmail.com) +Dharmendra Kushwaha (dharmendra.kushwaha@nectechnologies.in) +Dhriti Shikhar (dhrish20@gmail.com) +Dieter Plaetinck (dieter@vimeo.com) +Dirk Mueller (dirk@dmllr.de) +Dmitriy Ukhlov (dukhlov@mirantis.com) +Dmitry Ukov (dukov@mirantis.com) +Dolph Mathews (dolph.mathews@gmail.com) +Donagh McCabe (donagh.mccabe@gmail.com) +dongu (gmj03003@gmail.com) +Doron Chen (cdoron@il.ibm.com) +Doug Hellmann (doug@doughellmann.com) +Doug Weimer (dweimer@gmail.com) +Dr. 
Jens Harbott (harbott@osism.tech) +Dragos Manolescu (dragosm@hp.com) +Drew Balfour (andrew.balfour@oracle.com) +Eamonn O'Toole (eamonn.otoole@hpe.com) +Ed Leafe (ed.leafe@rackspace.com) +Edward Hope-Morley (opentastic@gmail.com) +Ehud Kaldor (ehud@unfairfunction.org) +Ellen Leahy (ellen.mar.leahy@hpe.com) +Elod Illes (elod.illes@est.tech) +Emett Speer (speer.emett@gmail.com) +Emile Snyder (emile.snyder@gmail.com) +Emmanuel Cazenave (contact@emcaz.fr) +Eohyung Lee (liquidnuker@gmail.com) +Eran Rom (eranr@il.ibm.com) +Eugene Kirpichov (ekirpichov@gmail.com) +Ewan Mellor (ewan.mellor@citrix.com) +Fabien Boucher (fabien.boucher@enovance.com) +Falk Reimann (falk.reimann@sap.com) +FatemaKhalid (fatemakhalid96@gmail.com) +Felipe Reyes (freyes@tty.cl) +Ferenc Horváth (hferenc@inf.u-szeged.hu) +Filippo Giunchedi (fgiunchedi@wikimedia.org) +Flavio Percoco (flaper87@gmail.com) +Florent Flament (florent.flament-ext@cloudwatt.com) +Florent Vennetier (florent.vennetier@ovhcloud.com) Florian Hines (syn@ronin.io) +François Charlier (francois.charlier@enovance.com) +Fujita Tomonori (fujita.tomonori@lab.ntt.co.jp) +Félix Cantournet (felix.cantournet@cloudwatt.com) +Gage Hugo (gh159m@att.com) +Ganesh Maharaj Mahalingam (ganesh.mahalingam@intel.com) +gaobin (gaobin@inspur.com) +gaofei (gao.fei@inspur.com) +Gaurav B. Gangalwar (gaurav@gluster.com) +gecong1973 (ge.cong@zte.com.cn) +gengchc2 (geng.changcai2@zte.com.cn) +Gerard Gine (ggine@swiftstack.com) +Gerry Drudy (gerry.drudy@hpe.com) +Ghanshyam Mann (gmann@ghanshyammann.com) +Gil Vernik (gilv@il.ibm.com) +Gilles Biannic (gilles.biannic@corp.ovh.com) +Gleb Samsonov (sams-gleb@yandex.ru) +Gonéri Le Bouder (goneri.lebouder@enovance.com) +Graham Hayes (graham.hayes@hpe.com) +Gregory Haynes (greg@greghaynes.net) +Grzegorz Grasza (xek@redhat.com) +Guang Yee (guang.yee@hpe.com) +guotao (guotao.bj@inspur.com) +Gábor Antal (antal@inf.u-szeged.hu) +Ha Van Tu (tuhv@vn.fujitsu.com) +Hamdi Roumani (roumani@ca.ibm.com) +Hanxi Liu (hanxi.liu@easystack.cn) +Harshada Mangesh Kakad (harshadak@metsi.co.uk) +Harshit Chitalia (harshit@acelio.com) +HCLTech-SSW (hcl_ss_oss@hcl.com) +Hervé Beraud (hberaud@redhat.com) +hgangwx (hgangwx@cn.ibm.com) +Hisashi Osanai (osanai.hisashi@gmail.com) +Hodong Hwang (hodong.hwang@kt.com) +Hou Ming Wang (houming.wang@easystack.cn) +houweichao (houwch@gohighsec.com) +Hu Bing (hubingsh@cn.ibm.com) +Hua Zhang (zhuadl@cn.ibm.com) +Hugo Kuo (tonytkdk@gmail.com) +Ilya Kharin (ikharin@mirantis.com) +Ionuț Arțăriși (iartarisi@suse.cz) Iryoung Jeong (iryoung@gmail.com) -Paul Jimenez (pj@place.org) -Brian K. Jones (bkjones@gmail.com) -Morita Kazutaka (morita.kazutaka@gmail.com) +its-not-a-bug-its-a-feature (david.cole@sohonet.com) +Ivan Anfimov (lazekteam@gmail.com) +Jaivish Kothari (jaivish.kothari@nectechnologies.in) +Jake Yip (jake.yip@ardc.edu.au) +James E. Blair (jeblair@openstack.org) +James Nguyen (ngmqng@gmail.com) +James Page (james.page@ubuntu.com) +Jamie Lennox (jlennox@redhat.com) +Jan Zerebecki (jan.openstack@zerebecki.de) +Janie Richling (jrichli@us.ibm.com) +Jason Johnson (jajohnson@softlayer.com) +Jay S. Bryant (jsbryant@us.ibm.com) +Jens Harbott (j.harbott@x-ion.de) +Jeremy Stanley (fungi@yuggoth.org) +Jesse Andrews (anotherjesse@gmail.com) +Ji-Wei (ji.wei3@zte.com.cn) +Jian Zhang (jian.zhang@intel.com) +Jiangmiao Gao (tolbkni@gmail.com) +Jianjian Huo (jhuo@nvidia.com) +jiaqi07 (wangjiaqi07@inspur.com) +Jing Liuqing (jing.liuqing@99cloud.net) +jinyuanliu (liujinyuan@inspur.com) +Joanna H. 
Huang (joanna.huitzu.huang@gmail.com) +Joe Arnold (joe@swiftstack.com) +Joe Gordon (jogo@cloudscaling.com) +Joe Yang (jyang@swiftstack.com) +Joel Wright (joel.wright@sohonet.com) +John Leach (john@johnleach.co.uk) +Jola Mirecka (jola.mirecka@hp.com) +Jon Snitow (otherjon@swiftstack.com) +Jonathan Gonzalez V (jonathan.abdiel@gmail.com) +Jonathan Hinson (jlhinson@us.ibm.com) Josh Kearney (josh@jk0.org) -Ed Leafe (ed.leafe@rackspace.com) -Tong Li (litong01@us.ibm.com) -Victor Lowther (victor.lowther@gmail.com) -Zhong Yue Luo (lzyeval@gmail.com) -Dragos Manolescu (dragosm@hp.com) Juan J. Martinez (juan@memset.com) +Julien Danjou (julien@danjou.info) +junboli (junbo85.li@gmail.com) +Kai Zhang (zakir.exe@gmail.com) +Kapil Thangavelu (kapil.foss@gmail.com) +karen chan (karen@karen-chan.com) +Kato Tomoyuki (kato.tomoyuki@jp.fujitsu.com) +Kazuhiro Miyahara (miyahara.kazuhiro@lab.ntt.co.jp) +Ke Liang (ke.liang@easystack.cn) +Kenichiro Matsuda (matsuda_kenichi@jp.fujitsu.com) +Keshava Bharadwaj (kb.sankethi@gmail.com) +kim woo seok (rladntjr4@gmail.com) +Kiyoung Jung (kiyoung.jung@kt.com) +Koert van der Veer (koert@cloudvps.com) +Konrad Kügler (swamblumat-eclipsebugs@yahoo.de) +Kota Tsuyuzaki (bloodeagle40234@gmail.com) +Ksenia Demina (kdemina@mirantis.com) +Kuan-Lin Chen (kuanlinchen@synology.com) +Kun Huang (gareth@unitedstack.com) +Larry Rensing (lr699s@att.com) +Leah Klearman (lklrmn@gmail.com) +Li Riqiang (lrqrun@gmail.com) +Liang Jingtao (liang.jingtao@zte.com.cn) +lijunbo (lijunbo@fiberhome.com) +likui (likui@yovole.com) +Lin Yang (lin.a.yang@intel.com) +Lingxian Kong (anlin.kong@gmail.com) +lingyongxu (lyxu@fiberhome.com) +Liu Siqi (meizu647@gmail.com) +liujiong (liujiong@gohighsec.com) +liuyamin (liuyamin@fiberhome.com) +Lokesh S (lokesh.s@hp.com) +Lorcan Browne (lorcan.browne@hpe.com) +Luciano Lo Giudice (luciano.logiudice@canonical.com) +Luis de Bethencourt (luis@debethencourt.com) +Luong Anh Tuan (tuanla@vn.fujitsu.com) +lvxianguo (lvxianguo@inspur.com) +M V P Nitesh (m.nitesh@nectechnologies.in) +Madhuri Kumari (madhuri.rai07@gmail.com) +Mahati Chamarthy (mahati.chamarthy@gmail.com) +Mandell Degerness (mdegerness@nvidia.com) +manuvakery1 (manu.km@idrive.com) +maoshuai (fwsakura@163.com) Marcelo Martins (btorch@gmail.com) -Donagh McCabe (donagh.mccabe@hp.com) -Andy McCrae (andy.mccrae@gmail.com) +Maria Malyarova (savoreux69@gmail.com) +Mark Gius (launchpad@markgius.com) +Mark Seger (mark.seger@hpe.com) +Martin Geisler (martin@geisler.net) +Martin Kletzander (mkletzan@redhat.com) +Maru Newby (mnewby@internap.com) +Masaki Tsukuda (tsukuda.masaki@po.ntts.co.jp) +Mathias Bjoerkqvist (mbj@zurich.ibm.com) +Matt Kassawara (mkassawara@gmail.com) +Matt Riedemann (mriedem@us.ibm.com) +Matthew Oliver (matt@oliver.net.au) +Matthew Vernon (mvernon@wikimedia.org) +Matthieu Huin (mhu@enovance.com) +Mauro Stettler (mauro.stettler@gmail.com) +Mehdi Abaakouk (sileht@redhat.com) +melissaml (ma.lei@99cloud.net) +Michael Matur (michael.matur@gmail.com) +Michael Shuler (mshuler@gmail.com) +Michele Valsecchi (mvalsecc@redhat.com) +Mike Fedosin (mfedosin@mirantis.com) +Mingyu Li (li.mingyu@99cloud.net) +Minwoo Bae (minwoob@us.ibm.com) +Mitsuhiro SHIGEMATSU (shigematsu.mitsuhiro@lab.ntt.co.jp) +mmcardle (mark.mcardle@sohonet.com) +Mohamed Hassaneen (mohammedashoor89@gmail.com) +Mohammed Al-Jawaheri (mjawaheri02@gmail.com) +Mohit Motiani (mohit.motiani@intel.com) +Monty Taylor (mordred@inaugust.com) +Morgan Fainberg (morgan.fainberg@gmail.com) +Morita Kazutaka (morita.kazutaka@gmail.com) +Motonobu Ichimura 
(motonobu@gmail.com) +Nada El-Mestkawy (nadamaged05@gmail.com) +Nadeem Syed (snadeem.hameed@gmail.com) +Nakagawa Masaaki (nakagawamsa@nttdata.co.jp) +Nakul Dahiwade (nakul.dahiwade@intel.com) +Nam Nguyen Hoai (namnh@vn.fujitsu.com) +Nandini Tata (nandini.tata@intel.com) +Naoto Nishizono (nishizono.naoto@po.ntts.co.jp) +Nassim Babaci (nassim.babaci@cloudwatt.com) +Nathan Kinder (nkinder@redhat.com) +nathang15 (nguyennathan1502@gmail.com) +Nelson Almeida (nelsonmarcos@gmail.com) +Newptone (xingchao@unitedstack.com) +ngcjny (noguchi.junya@fujitsu.com) +Ngo Quoc Cuong (cuongnq@vn.fujitsu.com) +Nguyen Hai (nguyentrihai93@gmail.com) +Nguyen Hung Phuong (phuongnh@vn.fujitsu.com) +Nguyen Phuong An (AnNP@vn.fujitsu.com) +Nguyen Quoc Viet (nguyenqviet98@gmail.com) +Nicholas Njihia (nicholas.njihia@canonical.com) +Nicolas Helgeson (nh202b@att.com) +Nicolas Trangez (ikke@nicolast.be) +Ning Zhang (ning@zmanda.com) +Nirmal Thacker (nirmalthacker@gmail.com) +niuke (niuke19970315@163.com) +npraveen35 (npraveen35@gmail.com) +Olga Saprycheva (osapryc@us.ibm.com) +Ondrej Novy (ondrej.novy@firma.seznam.cz) +Or Ozeri (oro@il.ibm.com) +Oshrit Feder (oshritf@il.ibm.com) +Paul Dardeau (paul.dardeau@intel.com) +Paul Jimenez (pj@place.org) +Paul Luse (paul.e.luse@intel.com) Paul McMillan (paul.mcmillan@nebula.com) -Ewan Mellor (ewan.mellor@citrix.com) +Pavel Kvasnička (pavel.kvasnicka@firma.seznam.cz) +Pawel Palucki (pawel.palucki@gmail.com) +Pearl Yajing Tan (pearl.y.tan@seagate.com) +pengyuesheng (pengyuesheng@gohighsec.com) +Peter Lisák (peter.lisak@gmail.com) +Peter Portante (peter.portante@redhat.com) +Petr Kovar (pkovar@redhat.com) +Philippe SERAPHIN (philippe.seraphin@infomaniak.com) +Pradeep Kumar Singh (pradeep.singh@nectechnologies.in) +Prashanth Pai (ppai@redhat.com) +Pádraig Brady (pbrady@redhat.com) +Qiaowei Ren (qiaowei.ren@intel.com) +Rafael Rivero (rafael@cloudscaling.com) +Rainer Toebbicke (Rainer.Toebbicke@cern.ch) +rajat29 (rajat.sharma@nectechnologies.in) +Ray Chen (oldsharp@163.com) +Rebecca Finn (rebeccax.finn@intel.com) +Renich Bon Ćirić (renich@cloudsigma.com) +Ricardo Ferreira (ricardo.sff@gmail.com) +Richard Hawkins (richard.hawkins@rackspace.com) +ricolin (ricolin@ricolky.com) +Robert Francis (robefran@ca.ibm.com) +Robin Naundorf (r.naundorf@fh-muenster.de) +Romain de Joux (romain.de-joux@ovhcloud.com) +Russ Nelson (russ@crynwr.com) +Russell Bryant (rbryant@redhat.com) +Sachin Patil (psachin@redhat.com) +Sam Morrison (sorrison@gmail.com) Samuel Merritt (sam@swiftstack.com) +Sarafraj Singh (Sarafraj.Singh@intel.com) +Sarvesh Ranjan (saranjan@cisco.com) +Sascha Peilicke (saschpe@gmx.de) +Saverio Proto (saverio.proto@switch.ch) +Scott Simpson (sasimpson@gmail.com) +Sean McGinnis (sean.mcginnis@gmail.com) +Sean Mooney (work@seanmooney.info) +SeongSoo Cho (ppiyakk2@printf.kr) +Sergey Kraynev (skraynev@mirantis.com) +Sergey Lukjanov (slukjanov@mirantis.com) +Shane Wang (shane.wang@intel.com) +shangxiaobj (shangxiaobj@inspur.com) +shaofeng_cheng (chengsf@winhong.com) +Shashank Kumar Shankar (shashank.kumar.shankar@intel.com) +Shashirekha Gundur (shashirekha.j.gundur@intel.com) +Shilla Saebi (shilla.saebi@gmail.com) +Shreeya Deshpande (shreeyad@nvidia.com) +Shri Javadekar (shrinand@maginatics.com) +Simeon Gourlin (simeon.gourlin@infomaniak.com) +Sivasathurappan Radhakrishnan (siva.radhakrishnan@intel.com) +Soren Hansen (soren@linux2go.dk) +Stefan Majewsky (stefan.majewsky@sap.com) Stephen Milton (milton@isomedia.com) -Russ Nelson (russ@crynwr.com) -Maru Newby (mnewby@internap.com) -Colin 
Nicholson (colin.nicholson@iomart.com) -Eamonn O'Toole (eamonn.otoole@hp.com) -Constantine Peresypkin (constantine@litestack.com) -Dan Prince (dprince@redhat.com) -Felipe Reyes (freyes@tty.cl) -Li Riqiang (lrqrun@gmail.com) +Steve Kowalik (steven@wedontsleep.org) +Steve Martinelli (stevemar@ca.ibm.com) +Steven Lang (Steven.Lang@hgst.com) +Sushil Kumar (sushil.kumar2@globallogic.com) +Takashi Kajinami (kajinamit@oss.nttdata.com) +Takashi Natsume (takanattie@gmail.com) +TheSriram (sriram@klusterkloud.com) +Thiago da Silva (thiagodasilva@gmail.com) +Thibault Person (thibault.person@ovhcloud.com) +Thierry Carrez (thierry@openstack.org) +Thomas Goirand (thomas@goirand.fr) +Thomas Herve (therve@redhat.com) +Thomas Leaman (thomas.leaman@hp.com) +Tiago Primini (primini@gmail.com) +Tim Burke (tim.burke@gmail.com) +Timothy Okwii (tokwii@cisco.com) +Timur Alperovich (timur.alperovich@gmail.com) +Tin Lam (tinlam@gmail.com) +Tobias Stevenson (tstevenson@vbridges.com) +Tom Fifield (tom@openstack.org) +Tomas Matlocha (tomas.matlocha@firma.seznam.cz) +tone-zhang (tone.zhang@linaro.org) +Tong Li (litong01@us.ibm.com) +Tovin Seven (vinhnt@vn.fujitsu.com) +Tra Bui (trabui.0517@gmail.com) +Travis McPeak (tmcpeak@us.ibm.com) +Tushar Gohad (tushar.gohad@intel.com) +Van Hung Pham (hungpv@vn.fujitsu.com) +venkatamahesh (venkatamaheshkotha@gmail.com) +Venkateswarlu Pallamala (p.venkatesh551@gmail.com) +Victor Lowther (victor.lowther@gmail.com) Victor Rodionov (victor.rodionov@nexenta.com) -Brent Roskos (broskos@internap.com) -Michael Shuler (mshuler@rackspace.com) -Andrew Clay Shafer (acs@parvuscaptus.com) -Scott Simpson (sasimpson@gmail.com) -Adrian Smith (adrian_f_smith@dell.com) -Monty Taylor (mordred@inaugust.com) -Caleb Tennis (caleb.tennis@gmail.com) -Rainer Toebbicke (Rainer.Toebbicke@cern.ch) -Fujita Tomonori (fujita.tomonori@lab.ntt.co.jp) -Kapil Thangavelu (kapil.foss@gmail.com) -Dean Troyer (dtroyer@gmail.com) -Kota Tsuyuzaki (tsuyuzaki.kota@lab.ntt.co.jp) +Victor Stinner (vstinner@redhat.com) +Viktor Varga (vvarga@inf.u-szeged.hu) +Vil Surkin (mail@vills.me) Vincent Untz (vuntz@suse.com) -Daniele Valeriani (daniele@dvaleriani.net) -Chris Wedgwood (cw@f00f.org) -Conrad Weidenkeller (conrad.weidenkeller@rackspace.com) -Doug Weimer (dweimer@gmail.com) -Cory Wright (cory.wright@rackspace.com) +Vitaly Bordyug (vbordug@gmail.com) +Vladimir Vechkanov (vvechkanov@mirantis.com) +Vu Cong Tuan (tuanvc@vn.fujitsu.com) +vxlinux (yan.wei7@zte.com.cn) +Walter Doekes (walter+github@wjd.nu) +wangdequn (wangdequn@inspur.com) +wanghongtaozz (wanghongtaozz@inspur.com) +wanghui (wang_hui@inspur.com) +wangqi (wang.qi@99cloud.net) +Wei LingFei (weilingfei@uniontech.com) +whoami-rajat (rajatdhasmana@gmail.com) +wu.shiming (wushiming@yovole.com) +Wu Wenxiang (wu.wenxiang@99cloud.net) +Wyllys Ingersoll (wyllys.ingersoll@evault.com) +xhancar (pavel.hancar@gmail.com) +XieYingYun (smokony@sina.com) +Yaguang Wang (yaguang.wang@intel.com) +Yan Xiao (yanxiao@nvidia.com) +yanghuichan (yanghc@fiberhome.com) +Yatin Kumbhare (yatinkumbhare@gmail.com) Ye Jia Xu (xyj.asmy@gmail.com) -Alex Yang (alex890714@gmail.com) -Pete Zaitcev (zaitcev@kotori.zaitcev.us) -Ning Zhang (ning@zmanda.com) +Yee (mail.zhang.yee@gmail.com) +Yu Yafei (yu.yafei@zte.com.cn) Yuan Zhou (yuan.zhou@intel.com) +yuhui_inspur (yuhui@inspur.com) +Yummy Bian (yummy.bian@gmail.com) +Yuriy Taraday (yorik.sar@gmail.com) +Yushiro FURUKAWA (y.furukawa_2@jp.fujitsu.com) +Yuxin Wang (wang.yuxin@ostorage.com.cn) +Zack M. 
Davis (zdavis@swiftstack.com) +Zap Chang (zapchang@gmail.com) +zengjia (zengjia@awcloud.com) +Zhang Guoqing (zhang.guoqing@99cloud.net) +Zhang Jinnan (ben.os@99cloud.net) +zhang.lei (zhang.lei@99cloud.net) +zhangboye (zhangboye@inspur.com) +zhangdebo1987 (zhangdebo@inspur.com) +zhangyanxian (zhangyanxianmail@163.com) +Zhao Lei (zhaolei@cn.fujitsu.com) +zhaoleilc (15247232416@163.com) +Zheng Yao (zheng.yao1@zte.com.cn) +zheng yin (yin.zheng@easystack.cn) +Zhenguo Niu (zhenguo@unitedstack.com) +zhengwei6082 (zhengwei6082@fiberhome.com) +ZhijunWei (wzj334965317@outlook.com) +ZhiQiang Fan (aji.zqfan@gmail.com) +ZhongShengping (chdzsp@163.com) +Zhongyue Luo (zhongyue.nah@intel.com) +zhufl (zhu.fanglei@zte.com.cn) +zhulingjie (easyzlj@gmail.com) +翟小君 (zhaixiaojun@gohighsec.com) diff --git a/CHANGELOG b/CHANGELOG index c5aada64c2..1aff48e4e4 100644 --- a/CHANGELOG +++ b/CHANGELOG @@ -1,3 +1,4555 @@ +swift (2.37.0) + + * The s3token middleware now passes service auth tokens to Keystone + if credentials are provided. This is required to enable S3 API + access for Keystone users when using Keystone >25.0.0, !=26.0.0, + !=26.0.1, !=27.0.0, !=28.0.0. See etc/proxy-server.conf-sample for + configuration details. For more information, see + https://security.openstack.org/ossa/OSSA-2025-002.html and + https://bugs.launchpad.net/keystone/+bug/2119646 + + * The s3token middleware now caches credential secrets for one minute + by default, if credentials are provided. Secret-caching typically + reduces the load on Keystone and is required for Keystone users to + be able to use signed aws-chunked transfers. To return to prior + behavior, explicitly set `secret_cache_duration = 0` in the + `[filter:s3api]` section of your proxy-server.conf. + + * Improved checksum validation for S3 API DeleteObjects requests. + + * POST requests are more likely to receive a 503 response in the + face of backend inconsistencies. + + * The KMS keymaster now supports selecting the endpoint returned in the + Keystone catalog via the `barbican_region_name` configuration option. + This may be useful in multi-region deployments which have multiple + endpoints. + + * The request line-length limit is now configurable for all WSGI servers + via the `max_request_line` option in the `[swift-constraints]` section + of swift.conf. By default, continue to use eventlet's default of 8192 + bytes. + + * Writes to sharded containers are less likely to have their updates + sent to the root container. This uses a new cooperative-token + mechanism to limit the number of concurrent shard range queries + to the root container; see the `[app:proxy-server]` section of + etc/proxy-server.conf-sample for configuration options. + + * The following new metrics were added when using labeled metrics: + + * The proxy-logging middleware may now emit real-time transfer metrics. + See the `statsd_emit_buffer_xfer_bytes_seconds` option in + etc/proxy-server.conf-sample for more information. + + * The proxy-logging middleware now includes an `api` label whose value + may be `swift` or `S3` depending on whether the client request is + serviced by the swift API or S3 API. + + * The s3api middleware now emits a counter recording the usage of + various protocol-related headers. + + * The container-sharder now emits a timing metric for the length of + time between shard range creation and cleaving. + + * `swift-manage-shard-ranges` now defaults to committing pending + updates before looking for shard range boundaries. 
A new option, + `--skip-commits`, may be used to restore previous behavior. + + * Added a `--clobber-hardlink-collisions` option to `swift-object-relinker`. + With this option enabled during the relink phase the relinker will + quarantine the colliding file in the new target part dir and retry the + relink. During the cleanup phase it will ignore the un-matched inode + "collision" and allow the cleanup of the old file in the old part dir + similar to tombstones. + + * Fixed the `swift_dir` option for WSGI servers; the file + `/etc/swift/swift.conf` no longer needs to exist when that option + is set. + + * Fixed an object-server error when there is a part-power increase in + progress and there was an issue marking the file in the new partition + space as durable. + + * Device names are now included in sharded database IDs, similar to + regular databases. This provides more context when examining + incoming/outgoing sync tables or sharding CleaveContexts. + + * Database replicators now clean up temporary files older than + `reclaim_age`. + + * Removed fallback support using netifaces; `getifaddrs` is now always + used to determine available IP addresses. + + * Various other minor bug fixes and improvements. + + +swift (2.36.0, OpenStack Flamingo) + + * S3 API + + * Added support for aws-chunked transfers. Recent AWS clients recently + began defaulting to this mode. See also: + https://docs.aws.amazon.com/AmazonS3/latest/API/sigv4-streaming.html + + * Added support for verifying additional checksums during upload. All + algorithms currently supported by AWS are supported: CRC64NVME, + CRC32, CRC32C, SHA1, and SHA256. See also: + https://docs.aws.amazon.com/AmazonS3/latest/userguide/checking-object-integrity.html + Note that some algorithms require the availability of additional + libraries: ISA-L or anycrc. + + * Added support for create-without-overwrite conditional writes. + + * Fixed HTTP framing issues when returning errors for a request with + `Expect: 100-continue`. + + * Improved various error messages to better imitate AWS responses. + + * Let clients request heartbeats during COPYs by including + the query parameter `heartbeat=on`. + + With heartbeating turned on, the proxy will start its response + immediately with 202 Accepted then send a single whitespace + character periodically until the request completes. At that + point, a final summary chunk will be sent which includes a + "Response Status" key indicating success or failure. + + * Labeled metrics + + * Added support for emitting labeled statsd metrics in a variety of + formats. Middleware authors should see the documentation at + https://docs.openstack.org/swift/latest/misc.html#swift.common.statsd_client.LabeledStatsdClient + for more information. + + * Instrumented proxy-logging with labeled metrics. See + `proxy-server.conf-sample` for more information. + + * Instrumented the object-server with labeled metrics. See + `object-server.conf-sample` for more information. + + * Added `access_user_id` logging field; out-of-tree auth middlewares should + use `environ['swift.access_logging']['user_id']` to populate this field. + + * Introduced an extensible ring format. This allows both more than 65,536 + devices and more data structures to be in a ring. For more information, + see https://docs.openstack.org/swift/latest/overview_ring_format.html#ring-v2. + + * SSYNC connections are now promptly terminated when subrequests timeout. + + * Python 3.13 (with the GIL enabled) is now supported. Free-threaded + builds remain untested. 
+ + * Removed support for Python 3.6. Flamingo (2025.2) will be the final + stable release to support Python 3.7 and 3.8. + + * Removed support for pickled ring files. These have not been written + since Swift 1.7.0. + + * Fixed a recursion error in the account-quota middleware. + + * Fixed an error in `invalidate_hash` when the partition is deleted while + waiting for the partition lock. + + * Various other minor bug fixes and improvements. + + +swift (2.35.0, OpenStack Epoxy) + + * Removed the use of `eval` in the xprofile middleware. Note that this + middleware is only intended for development purposes and is not + intended for use in production systems. + + * Account listings now include storage policy information for the + containers listed. + + * The S3 API no longer requires a `Content-MD5` header for `DeleteObjects` + requests when using v4 signatures. + + * Uploads to containers with object versioning enabled now require a + `Content-Length` or `Transfer-Encoding: chunked` header, similar to + other containers. + + * Fixed a server error when deleting a specific version via the S3 API. + + * `X-Open-Expired` now works properly with `?part-number` requests. + + * Fixed `Content-Type` and `Content-Length` headers in account and + container `HEAD` responses (with eventlet>=0.38.0). + + * Object expiration fixes: + + * The configuration options `expiring_objects_container_divisor` and + `expiring_objects_account_name` are now deprecated. + + If a cluster was deployed with a non-standard account name, operators + should remove the option from all configs so they are using a supported + configuration going forward, but will need to deploy stand-alone expirer + processes with legacy expirer config to clean-up old expiration tasks + from the previously configured account name. + + * Added a new configuration option, `round_robin_task_cache_size`, to + adjust the number of tasks to cache before processing. This may be used + to trade faster expirer start-up for more lumpy container-server load. + + * The object-expirer now better handles errors during listings. + + * The object-expirer now respects the `internal_client_conf_path` + configuration option in legacy `object-expirer.conf` configs. + + * WSGI process management improvements: + + * Added a `stale_worker_timeout` configuration option to the WSGI + servers. Once this time elapses following a reload, the manager + process will issue SIGKILLs to any remaining stale workers. + + * Improved the reliability of `swift-reload`. + + * Object updater observability improvements: + + * Added last start time to recon dumps as `object_updater_last`. + + * Added information (including target account/container) from oldest + failed updates to recon dumps, both per-device and aggregated for the + node. Use the new `async_tracker_max_entries` and + `async_tracker_dump_count` options to adjust how many records to + collect. + + * Separated unlinks-due-to-outdated-updates from + unlinks-due-to-fully-processed-updates in logged stats. + + * Added the option to tune down ETag validation in the object-server + during full-object reads. By default, every full read will continue + to have its ETag validated as bytes are streamed to the proxy-server. + The `etag_validate_pct` option may be used to configure approximately + what percentage of full-object reads should be validated; reducing this + can improve performance when object-servers are CPU-constrained. + + Partial reads continue to never have their ETag validated in the + object-server. 
The object-auditor continues to periodically validate + every object's ETag. + + * The `cooperative_period` option for the object-server now affects PUT + requests in a way similar to GET responses. + + * Fixed an issue with the object-reconstructor that would prevent + reconstruction of objects with non-ASCII header names. + + * Fixed an issue with the container-reconciler that could cause reconciler + databases to have conflicting rows that could not be resolved. + + * Removed use of the deprecated cgi module. + + * Various other minor bug fixes and improvements. + + +swift (2.34.0, OpenStack Dalmatian) + + * Middleware features: + + * The static large object (SLO) middleware now supports including + a `?part-number=` query parameter to request just part of a + large object. This may be used to enable efficient parallel + downloads. For more information, see + https://docs.openstack.org/swift/latest/overview_large_objects.html#retrieving-a-large-object + + * The S3 API middleware now supports the `?partNumber=` query + parameter, enabling parallel downloads. + + * The KMS keymaster now supports overriding the endpoint returned + in the Keystone catalog via the `barbican_endpoint` configuration + option. This may be useful in multi-region deployments which have + multiple endpoints. + + * The backend ratelimiter now supports dynamic reloading of limits. + The new configuration options `backend_ratelimit_conf_path` and + `config_reload_interval` control which file is reloaded and how + frequently, respectively. + + * The backend ratelimiter now supports per-method, per-device + ratelimits. See `etc/backend-ratelimit.conf-sample` for more + information. + + * S3 API improvements: + + * Error response reasons are now logged as part of the `log_info` + field. This can be especially useful when diagnosing HEAD + failures, which necessarily have no response body. + + * Fixed a server error when using non-ASCII access key IDs. + + * Fixed several checksum-related error responses to be more AWS-like. + + * Account quota improvements: + + * Overall account byte quotas should now be set with the + `X-Account-Quota-Bytes` header. The `X-Account-Meta-Quota-Bytes` + header is now deprecated. + + * The account quota middleware now supports object-count quotas + in addition to byte-count quotas, similar to the container + quota middleware. For more information, see + https://docs.openstack.org/swift/latest/middleware.html#module-swift.common.middleware.account_quotas + + * Using an `X-Remove-Account-Quota-Bytes-Policy-` header + now removes the per-policy quota, rather than reducing it to zero. + + * Object expiration improvements: + + * Added per-account and per-container reaping delays. These may be + used to offer some grace period in which to recover expired objects. + + * Added a proxy-server configuration option: `allow_open_expired`. + This defaults to false; if true, clients may intereact with expired + objects by including an `X-Open-Expired: true` header in GET, HEAD, + or POST requests. + + * Expiring object queue entries now include the size of the object to + be expired in the `swift_expirer_bytes` parameter of the queue entry's + content-type. + + * Added metrics to count skipped, delayed, and assigned tasks as + they're enumerated. + + * Proxy-server fixes: + + * Object POSTs now 503 rather than trusting the 404s that might be + returned from handoffs when primaries are overloaded. + + * Client disconnects should always be logged within the context of + the appropriate client request. 
Previously, there were some cases + where logging would occur during general garbage collection, leading + to incorrect or missing transaction IDs in logs. + + * The proxy-logging middleware now emits timing and transfer stats for + more requests such as auth requests. These will be labeled `UNKNOWN` + rather than `account`, `container`, etc. + + * Fixed a server error when the Swift request path has missing account + or container components. + + * Python 3.12 is now supported. + + * `EUCLEAN` errors are better handled on the object server. + + * `swift-account-info` now supports the `--sync` option to display the + contents of the incoming and outgoing sync tables, similar to + `swift-container-info`. + + * The `swift-drive-audit` tool now works with ISO timestamps in kernel + logs. + + * The `swift-recon-cron` tool now better handles missing directories. + + * Dependency update: lxml must be at least 4.2.3. + + * Various other minor bug fixes and improvements. + + +swift (2.33.0, OpenStack Caracal) + + * S3 API fixes: + + * When the `+segments` container's storage policy differs from that of + the primary container, completed manifests are now written with the + correct policy in the primary container. + + * Add basic read support for object locking. This improves + compatibility with an Ansible S3 module. Write support is not + yet implemented, so get-object-lock-configuration will always 404. + + * If there's a conflict deleting the in-progress-upload marker when + completing a multipart-upload, a 503 is now returned to the client, + prompting it to retry. + + * Added `Accept-Ranges: bytes` to object responses. Range requests + have always been supported; now, that support is properly advertised. + + * Static large object fixes: + + * Fixed a server error when handling conditional GET requests. + + * Return an error if the SLO manifest could not be parsed. Previously, + a zero-byte response was returned. + + * Proxy server fixes: + + * Added a new `swift.proxy_logging_status` request environment key that + middlewares may use to override the logged status for a request. + + * Transaction IDs are included in more error responses. + + * Added a counter metric when caching shard ranges. + + * The `recoverable_node_timeout` option no longer applies to + `X-Newest` GET requests. + + * Improved error-handling in multi-part range responses. + + * Sharding fixes: + + * Prevent resets of a shard range's epoch. + + * Cleaned up `X-Backend-*` headers in listing responses. + + * Reduced the frequency of `Reclaimable db stuck waiting for shrinking` + messages when a root DB has been deleted but its shards have not been + shrunk away. + + * The more-efficient shard range structure from the last release is now + used when fetching ranges from the backend. + + * Include more information in shard-replication warnings. + + * Object server fixes: + + * Object POSTs and chunked PUTs are no longer accepted when the target + drive is already past its `fallocate_reserve`. DELETEs are still + allowed. + + * Added the ability to configure cooperative yielding when servicing + GET responses, via the `cooperative_period` option. See the example + config for more information. + + * Invalid `hashes.invalid` entries are now ignored, rather than + causing a complete partition rehash. + + * Prefix-based tempurls may now be used to explore staticweb + listings within that prefix. Note that this opens a new ability + to list containers from tempurls, but only if staticweb's + `X-Container-Meta-Web-Listings` is enabled. 
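+
+    A minimal sketch of the prefix-based tempurl usage described above,
+    assuming a temp-url key has already been set on the container and
+    `X-Container-Meta-Web-Listings: true` is enabled; the key, paths, and
+    parameter values are placeholders (see the tempurl documentation for
+    the exact signing rules):
+
+        import hmac
+        import time
+        from hashlib import sha256
+
+        key = b'container-temp-url-key'   # placeholder secret
+        expires = int(time.time()) + 3600
+        prefix_path = '/v1/AUTH_test/web-container/photos/'
+
+        hmac_body = 'GET\n%d\nprefix:%s' % (expires, prefix_path)
+        sig = hmac.new(key, hmac_body.encode('utf-8'), sha256).hexdigest()
+
+        # Fetching this URL returns the staticweb listing scoped to photos/
+        url = ('%s?temp_url_sig=%s&temp_url_expires=%d&temp_url_prefix=photos/'
+               % (prefix_path, sig, expires))
+        print(url)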
+ + * When generating index pages from listings, staticweb now sends an HTML5 + doctype. This makes them https://peps.python.org/pep-0503/ compliant, + allowing their continued use for simple Python package repositories. + + * Per-service `auto_create_account_prefix` configuration options have + been removed. These options were deprecated in favor of `swift.conf` + configuration in Swift 2.24.0, part of the OpenStack Ussuri release. + + * Added a `swift-reload` command to assist with safely reloading WSGI + servers. + + * Daemons now send `STOPPING` and `RELOADING` systemd notifications + when the service is configured with `Type=notify`. + + * Added more metrics to the container-server, allowing GET and PUT timings + to be broken out for listings, shard range operations, and container + creation. + + * Daemons send object updates via the replication network in more cases. + + * `swift-account-info` and `swift-container-info` now accept a `--sync` + flag to show information from the incoming/outgoing sync tables. + + * Several fixes to prepare for Python 3.12 support. While not yet tested + in the gate, initial manual testing looks promising. + + * Added support for recent versions of eventlet. + + * The dark-data object audit watcher now works with sharded containers. + Previously, it would think that all data files were absent from + listings. + + * Various other minor bug fixes and improvements. + + +swift (2.32.0, OpenStack Bobcat) + + * Python 3 fixes: + + * Python 3 object servers can now read unencrypted non-ASCII metadata + that was written under Python 2. + + * Ssync no longer corrupts unencrypted non-ASCII metadata during + transfers. + + * Fixed an encoding issue when writing non-ASCII object names to sharded + containers and shard range caching is not enabled. + + * Fixed an encoding issue when handling non-ASCII account names. + + * Fixed a `generator already executing` error on client disconnect. + + * Suppressed `RemoteDisconnected` tracebacks. + + * Metrics improvements: + + * Metrics are now emitted for a variety of S3 error responses, in the + form `s3api..[.]` + + * Fixed an issue that prevented proxy servers from emitting metrics and + logs for backend requests made when getting account or container info. + + * Account and container info metrics now include the response status code + when backend requests are made. + + * Added timing metrics to the container sharder for various operations. + + * Python 3.11 is now supported. + + * Added the ability for reseller admins to set per-policy account quotas by + posting metadata of the form `X-Account-Quota-Bytes-Policy-`. + + * Added a `keepalive_timeout` option to the proxy server to limit how long + to wait for a client to initiate a request, separate from the general + `client_timeout` option. Note that this requires eventlet 0.34.0 + (currently unreleased) or later. + + * Added a `keep_cache_slo_manifest` option to the object server to better + control whether SLO manifests are dropped from the page cache. + + * WSGI servers now accept a `--test-config` option that may be used to + validate configuration changes before reloading/restarting the server. + + * The structure of cached shard ranges has changed, improving performance + when listing or writing to sharded containers. Note that immediately + after upgrade, the new structures will all be cache misses, which may + lead to a thundering herd problem. 
To avoid this, upgrade just a few + nodes first, let them service some fraction of traffic to populate the + cache, then upgrade the rest of the cluster. + + * A variety of performance improvements have been made for sharded + container databases. + + * Various logging and metrics improvements when talking to memcache. + + * Fixed ssync's handling of timestamp offsets. Previously, this could cause + ssync to fail with a 409 Conflict, causing the transfer to fail and + preventing handoffs from clearing. + + * Fixed an issue where an erasure-coded PUT could prevent other requests + from being processed when network calls rarely or never blocked. + + * Fixed an issue when downloading an SLO manifest would hit a recoverable + error and attempt to resume from another node. This would manifest as + either a pyeclib decode error or an unexpected empty response. + + * The proxy server now applies error-limiting to the correct node when + handling a recoverable node error. + + * Account, container, and object log fields are now correctly identified + when returning `BadDigest` responses to S3 requests. + + * Previously, under some circumstances, a non-standard config option such + as `RECLAIM_AGE` might get parsed as `reclaim_age` for some processes + but ignored by others. Now, all config parsing is case-sensitive; + non-standard names will always be ignored. + + * Reduced the backend load of making `?versions` requests to a container + that has never had object versioning enabled. + + * Improved formatting of meta and sysmeta for `swift-account-info` and + `swift-container-info`. + + * The standard-library `logging` module is no longer monkey-patched when + importing `swift.common.utils`, making it easier to re-use swift code + in other contexts. + + * Removed the hard dependency on netifaces; it may still be used if the + `getifaddrs` C function is not available. This fallback support may be + removed in a future release. + + * Various other minor bug fixes and improvements. + + +swift (2.31.1, OpenStack Antelope) + + * Sharding fixes + + * Shards no longer report stats to the root database when they are in + the CREATED state. + + * Sharding metadata is no longer cleared when databases are deleted. + This could previously cause deleted shards that still had rows to + become stuck and never move them to the correct database. + + * Fixed a performance regression in the handling of misplaced objects. + + * Swift path and on-disk path are now included with all sharder logging. + + * `s3token` no longer mangles request paths that include the Access Key ID. + + * User metadata is now exposed via CORS when encryption is enabled, + matching the behavior when encryption is not enabled. + + * Fewer backend requests are now required when account or container + information is missing from memcache. + + * Fixed logging of IP and port in the proxy-server; in particular, + internal clients now correctly log about the replication IP/port. + + * Fixed a bug in the object replicator that would cause an under-reporting + of failures. + + * Various other minor bug fixes. + + +swift (2.31.0) + + * S3 API improvements + + * Fixed a security issue in how `s3api` handles XML parsing that allowed + authenticated S3 clients to read arbitrary files from proxy servers. + Refer to CVE-2022-47950 for more information. + + * Fixed a server error when handling malformed CompleteMultipartUpload + requests. + + * Improved error reporting when attempting to set invalid `X-Delete-At` + or `X-Delete-After` values via the S3 API. 
+ + * Sharding improvements + + * Sync more shard ranges from the root database to the shards. This + helps ensure shard range repairs effected at the root make their way + to shards that would otherwise be stuck trying to further divide + into sub-shards. + + * Added a `merge` subcommand to `swift-manage-shard-ranges` to merge + arbitrary shard ranges into a container DB. Minimal safety checks + are performed; it should only be used for emergency shard range + manipulation by expert users. + + * Improved performance of `delimiter` listings for sharded containers. + + * Added more safety checks to the `repair` subcommand of + `swift-manage-shard-ranges`. + + * Better handle `EOFError` and `KeyboardInterrupt` when prompting for + input in `swift-manage-shard-ranges`. + + * Warnings are now emitted when sharding appears to have become stuck. + Use the new `container_sharding_timeout` option to configure the + "stuck" threshold; the default is 48 hours. + + * Stop warning about transient overlaps when auditing shard ranges. + + * Metrics improvements + + * Added timing stats for memcached operations. + + * Renamed and improved the granularity of shard range cache and + backend stats. Metrics dashboards may need to be updated. + + * Emit stats when backend nodes are error-limited. + + * Added support for Python 3.10. + + * Added an optional `backend_ratelimit` middleware for backend servers. + See the backend server sample configuration files for more information. + + * Added the ability to configure a chance to skip checking memcache when + querying account and container information. This allows some fraction + of traffic to go to disk and refresh memcache before the key ages out. + Recommended values for the new `account_existence_skip_cache_pct` and + `container_existence_skip_cache_pct` options are in the range of + 0.0 to 0.01. + + * Static large object segments may now be deleted asynchronously by + default. Operators may return to the old behavior by disabling the + `allow_async_delete` option in the `[filter:slo]` section + in their proxy-server.conf. + + * Absolute-form request targets are now accepted. This enables access for + certain clients and SDKs (including some older versions of rclone that + were using an old version of aws-sdk-go). + + * Fixed a path-rewriting bug introduced in Python 3.7.14, 3.8.14, 3.9.14, + and 3.10.6 that could cause some `domain_remap` requests to be routed to + the wrong object. + + * Fixed a server error when attempting to access data in a deleted + container that had an erasure-coded storage policy. + + * Improved error messages to clients that encounter errors using the + `formpost` middleware. + + * Removed some inappropriate error-suppression when locking account and + container databases. + + * Improved server start-up time when using multiple workers. + + * Removed some unnecessary locking when logging. + + * Added some basic object-metadata validation; invalid diskfiles will be + quarantined via the auditor or reconstructor. + + * Enhanced logging when error-limiting a backend node. + + * Various other minor bug fixes and improvements. + + +swift (2.30.1, zed stable backports) + + * Fixed a security issue in how `s3api` handles XML parsing that allowed + authenticated S3 clients to read arbitrary files from proxy servers. + Refer to CVE-2022-47950 for more information. + + * Fixed a path-rewriting bug introduced in Python 3.7.14, 3.8.14, 3.9.14, + and 3.10.6 that could cause some `domain_remap` requests to be routed to + the wrong object. 
+ + +swift (2.30.0, OpenStack Zed) + + * Sharding improvements + + * The `swift-manage-shard-ranges` tool has a new mode to repair gaps + in the namespace. + + * Misplaced tombstone records are now properly cleaved. + + * Fixed a bug where the sharder could fail to find a device to use for + cleaving. + + * Databases marked deleted are now processed by the sharder. + + * More information is now synced to the fresh database when sharding. + Previously, a database could lose the fact that it had been marked + as deleted. + + * Shard ranges with no rows to cleave could previously be left in the + CREATED state after cleaving. Now, they are advanced to CLEAVED. + + * Metrics are now emitted for whether databases used for cleaving + were created or already existed, allowing a better understanding + of the reason for handoffs in the cluster. + + * Misplaced-record stats are now also emitted to statsd. Previously, + these were only available in logs. + + * S3 API improvements + + * Constant-time string comparisons are now used when checking signatures. + + * Fixed cross-policy object copies. Previously, copied data would + always be written using the source container's policy. Now, the + destination container's policy will be used, avoiding availability + issues and unnecessary container-reconciler work. + + * More headers are now copied from multi-part upload markers to their + completed objects, including `Content-Encoding`. + + * When running with `s3_acl` disabled, `bucket-owner-full-control` and + `bucket-owner-read` canned ACLs will be translated to the same Swift + ACLs as `private`. + + * The S3 ACL and Delete Multiple APIs are now less case-sensitive. + + * Improved the error message when deleting a bucket that's ever had + versioning enabled and still has versions in it. + + * `LastModified` timestamps in listings are now rounded up to whole + seconds, like they are in responses from AWS. + + * Proxy logging for Complete Multipart Upload requests is now more + consistent when requests have been retried. + + * Logging improvements + + * Signal handling is more consistently logged at notice level. + Previously, signal handling would sometimes be logged at info + or error levels. + + * The message template for proxy logging may now include a + `{domain}` field for the client-provided `Host` header. + + * The object-replicator now logs successful rsync transfers at debug + instead of info. + + * Added a `log_rsync_transfers` option to the object-replicator. + Set it to false to disable logging rsync "send" lines; during + large rebalances, such logging can overwhelm log aggregation + while providing little useful information. + + * Transaction IDs are now only included in daemon log lines + in a request/response context. + + * Fixed a socket leak when clients try to delete a non-SLO as though + it were a Static Large Object. + + * The formpost digest algorithm is now configurable via the new + `allowed_digests` option, and support is added for both SHA-256 + and SHA-512. Supported formpost digests are exposed to clients in + `/info`. Additionally, formpost signatures can now be base64 encoded. + + * Added metrics to the formpost and tempurl middlewares to monitor + digest usage in signatures. + + * SHA-1 signatures are now deprecated for the formpost and tempurl + middlewares. At some point in the future, SHA-1 will no longer be + enabled by default; eventually, support for it will be removed + entirely. + + * Improved compatibility with certain FIPS-mode-enabled systems. 
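+
+    A hedged configuration sketch for the formpost `allowed_digests` option
+    noted above; the value list is illustrative only, and the supported
+    names and defaults are those documented in proxy-server.conf-sample:
+
+        [filter:formpost]
+        use = egg:swift#formpost
+        # e.g. drop the deprecated SHA-1 and accept only stronger digests
+        allowed_digests = sha256 sha512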
+ + * Added a `ring_ip` option for various object services. This may be + used to find own devices in the ring in a containerized environment + where the `bind_ip` may not appear in the ring at all. + + * Account and container replicators can now be configured with a + `handoff_delete` option, similar to object replicators and + reconstructors. See the sample config for more information. + + * Developers using Swift's memcache client may now opt in to having + a `MemcacheConnectionError` be raised when no connection succeeded + using a new `raise_on_error` keyword argument to `get`/`set`. + + * The tempurl middleware has been updated to return a 503 if storing a + token in memcache fails. Third party authentication middlewares are + encouraged to also use the new `raise_on_error` keyword argument + when storing ephemeral tokens in memcache. + + * Pickle support has been removed from Swift's memcache client. Support + had been deprecated since Swift 1.7.0. + + * Device names are now included in new database IDs. This provides more + context when examining incoming/outgoing sync tables or sharding + CleaveContexts. + + * Database replication connections are now closed following an error + or timeout. This prevents a traceback in some cases when the replicator + tries to reuse the connection. + + * `ENOENT` and `ENODATA` errors are better handled in the object + replicator and auditor. + + * Improved object update throughput by shifting some shard range + filtering from Python to SQL. + + * Include `Vary: Origin` header when CORS responses vary by origin. + + * The staticweb middleware now allows empty listings at the root of + a container. Previously, this would result in a 404 response. + + * Ring builder output tables better display weights over 1000. + + * Various other minor bug fixes and improvements. + + +swift (2.29.2, yoga stable backports) + + * Fixed a security issue in how `s3api` handles XML parsing that allowed + authenticated S3 clients to read arbitrary files from proxy servers. + Refer to CVE-2022-47950 for more information. + + * Constant-time string comparisons are now used when checking S3 API + signatures. + + * Fixed a path-rewriting bug introduced in Python 3.7.14, 3.8.14, 3.9.14, + and 3.10.6 that could cause some `domain_remap` requests to be routed to + the wrong object. + + * Improved compatibility with certain FIPS-mode-enabled systems. + + +swift (2.29.1, OpenStack Yoga) + + * This is the final stable branch that will support Python 2.7. + + * Fixed s3v4 signature calculation when the client sends an un-encoded + path in the request. + + * Fixed multiple issues in s3api involving Multipart Uploads with + non-ASCII names. + + * The object-updater now defers rate-limited updates to the end of its + cycle; these deferred updates will be processed (at the limited rate) + until the configured `interval` elapses. A new `max_deferred_updates` + option may be used to bound the deferral queue. + + * Empty account and container partition directories are now cleaned up + immediately after replication, rather than needing to wait for an + additional replication cycle. + + * The object-expirer now only cleans up empty containers. Previously, it + would attempt to delete all processed containers, regardless of whether + there were entries which were skipped or had errors. + + * A new `item_size_warning_threshold` option may be used to monitor for + values that are approaching the limit of what can be stored in memcache. + See the memcache sample config for more information. 
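+
+    As a hedged illustration of the option described in the previous bullet
+    (the threshold value is arbitrary; see memcache.conf-sample for the
+    authoritative default and units):
+
+        [memcache]
+        # warn when cached values get close to memcached's item size limit
+        item_size_warning_threshold = 1000000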
+ + * Internal clients now correctly use their configured User-Agent in + backend requests, rather than only using it for logging. + + * Various other minor bug fixes and improvements. + + +swift (2.29.0) + + * S3 API improvements + + * CORS preflights are now allowed for pre-signed URLs. + + * The `storage_domain` option now accepts a comma-separated list of + storage domains. This allows multiple storage domains to configured + for use with virtual-host style addressing. + + * Fixed the types of configured values in /info response. + + * Fixed a server error when trying to copy objects with non-ASCII names. + + * Fixed a server error when uploading objects with very long names. + A KeyTooLongError is now returned. + + * Fixed an error when multi-deleting MPUs when SLO async-deletes + are enabled. + + * Fixed an error that allowed list-uploads and list-parts requests to + return incomplete or out-of-order results. + + * Fixed several bugs when dealing with non-ASCII object names and + multipart uploads. + + * Reduced the overhead of retrieving bucket and object ACLs. + + * Replication, reconstruction, and diskfile improvements + + * The reconstructor now uses the replication network to fetch fragments + for reconstruction. + + * Added the ability to limit how many objects per handoff partition + will be reverted in a reconstructor cycle using the new + `max_objects_per_revert` option. This may be useful to reduce + ssync timeouts and lock contention, ensuring that progress is made + during rebalances. + + * Ensure that non-durable data and .meta files are purged from handoffs + after syncing. + + * Fixed tracebacks when there's a race to mark a file durable or delete it. + + * Improved cooperative multitasking during ssync. + + * Upon detecting a ring change, the reconstructor now only aborts the + jobs for that ring and continues processing jobs for other rings. + + * Fixed a traceback when logging about a lock timeout in the replicator. + + * Object updater improvements + + * Added the ability to ratelimit updates (approximately) per-container + using the new `max_objects_per_container_per_second` option. This may + be used to limit requests to already-overloaded containers while still + making progress on updates to other containers. + + * Added timing stats by response code. + + * Updates are now sent over the replication network. + + * Fixed a race condition where swift would attempt to quarantine + recently-deleted updates. + + * Memcache improvements + + * Added the ability to configure a chance to skip checking memcache when + querying shard ranges. This allows some fraction of traffic to go to + disk and refresh memcache before the key ages out. Recommended values + for the new `container_updating_shard_ranges_skip_cache_pct` and + `container_listing_shard_ranges_skip_cache_pct` options are in the + range of 0.0 to 0.1. + + * Added stats for shard range cache hits, misses, and skips. + + * Improved handling of timeouts and other errors when obtaining a + connection to memcached. + + * Recon improvements + + * Added object-reconstructor stats to recon. + + * Each object-server IP is now queried only once when reporting disk + usage. Previously, each port in the ring would be queried; when using + servers-per-port, this could dramatically overstate the disk capacity + in the cluster. + + * Fixed a security issue where tempurl and s3api signatures were logged in + full. 
This allowed an attacker with access to log data to perform replay + attacks, potentially accessing or overwriting cluster data. Now, such + signatures are redacted in a manner similar to auth tokens; see the + `reveal_sensitive_prefix` option in `proxy-server.conf`. + + See CVE-2017-8761 for more information. + + * Added a new `swift.common.registry` module. This includes helper + functions `register_sensitive_header` and `register_sensitive_param` + which third party middleware authors may use to flag headers and query + parameters for redaction when logging. For more information, see + https://docs.openstack.org/swift/latest/misc.html#module-swift.common.registry + + * Added the ability to configure project-scope read-only roles for + keystoneauth using the new `project_reader_roles` option. + + * The cname_lookup middleware now works with dnspython 2.0 and later. + + * The internal clients used by the container-reconciler, container-sharder, + container-sync, and object-expirer daemons now use a more-descriptive + `-ic` log name, rather than `swift`. If you previously + configured the `log_name` option in `internal-client.conf`, you must + now use the `set log_name = ` syntax to configure it, even if + no value is set in the `[DEFAULT]` section. This may be done prior to + upgrading. + + * Fixed a bug that allowed some statsd metrics to be annotated with the + wrong backend layer. + + * The `StatsdClient.set_prefix` method is now deprecated and + may be removed in a future release; by extension, so is the + `LogAdapter.set_statsd_prefix` method. Middleware developers should + use the `statsd_tail_prefix` argument to `get_logger` instead. + + * Fixed a traceback in the account-server when there's no account + database on disk to receive a container update. The account-server + now correctly 404s. + + * The container-updater will quarantine container databases if all + replicas for the account respond 404. + + * Fixed a proxy-server error when the read-only middleware tried to + handle non-Swift paths (such as may be used by third-party middleware). + + * Some client behaviors that the proxy previously logged at warning have + been lowered to info. + + * Removed translations from most logging. + + * Various other minor bug fixes and improvements. + + +swift (2.28.1, xena stable backports) + + * Fixed a security issue in how `s3api` handles XML parsing that allowed + authenticated S3 clients to read arbitrary files from proxy servers. + Refer to CVE-2022-47950 for more information. + + * Constant-time string comparisons are now used when checking S3 API + signatures. + + * Fixed a path-rewriting bug introduced in Python 3.7.14, 3.8.14, 3.9.14, + and 3.10.6 that could cause some `domain_remap` requests to be routed to + the wrong object. + + * Improved compatibility with certain FIPS-mode-enabled systems. + + * Ensure that non-durable data and .meta files are purged from handoffs + after syncing. + + +swift (2.28.0, OpenStack Xena) + + * Sharding improvements: + + * When building a listing from shards, any failure to retrieve + listings will result in a 503 response. Previously, failures + fetching a particular shard would result in a gap in listings. + + * Container-server logs now include the shard path in the referer + field when receiving stat updates. + + * Added a new config option, `rows_per_shard`, to specify how many + objects should be in each shard when scanning for ranges. The default + is `shard_container_threshold / 2`, preserving existing behavior.
+ + * Added a new config option, `minimum_shard_size`. When scanning + for shard ranges, if the final shard would otherwise contain + fewer than this many objects, the previous shard will instead + be expanded to the end of the namespace (and so may contain up + to `rows_per_shard + minimum_shard_size` objects). This reduces + the number of small shards generated. The default value is + `rows_per_shard / 5`. + + * Added a new config option, `shrink_threshold`, to specify the + absolute size below which a shard will be considered for shrinking. + This overrides the `shard_shrink_point` configuration option, which + expressed this as a percentage of `shard_container_threshold`. + `shard_shrink_point` is now deprecated. + + * Similar to above, `expansion_limit` was added as an absolute-size + replacement for the now-deprecated `shard_shrink_merge_point` + configuration option. + + * The sharder now correctly identifies and fails audits for shard + ranges that overlap exactly. + + * The sharder and swift-manage-shard-ranges now consider total row + count (instead of just object count) when deciding whether a shard + is a candidate for shrinking. + + * If the sharder encounters shard range gaps while cleaving, it will + now log an error and halt sharding progress. Previously, rows may + not have been moved properly, leading to data loss. + + * Sharding cycle time and last-completion time are now available via + swift-recon. + + * Fixed an issue where resolving overlapping shard ranges via shrinking + could prematurely mark created or cleaved shards as active. + + * `swift-manage-shard-ranges` improvements: + + * Exit codes are now applied more consistently: + + - 0 for success + - 1 for an unexpected outcome + - 2 for invalid options + - 3 for user exit + + As a result, some errors that previously resulted in exit code 2 + will now exit with code 1. + + * Added a new 'repair' command to automatically identify and + optionally resolve overlapping shard ranges. + + * Added a new 'analyze' command to automatically identify overlapping + shard ranges and recommend a resolution based on a JSON listing + of shard ranges such as produced by the 'show' command. + + * Added a `--includes` option for the 'show' command to only output + shard ranges that may include a given object name. + + * Added a `--dry-run` option for the 'compact' command. + + * The 'compact' command now outputs the total number of compactible + sequences. + + * S3 API improvements: + + * Added an option, `ratelimit_as_client_error`, to return 429s for + rate-limited responses. Several clients/SDKs have seem to support + retries with backoffs on 429, and having it as a client error + cleans up logging and metrics. By default, Swift will respond 503, + matching AWS documentation. + + * Fixed a server error in bucket listings when `s3_acl` is enabled + and staticweb is configured for the container. + + * Fixed a server error when a client exceeds `client_timeout` during an + upload. Now, a `RequestTimeout` error is correctly returned. + + * Fixed a server error when downloading multipart uploads/static large + objects that have missing or inaccessible segments. This is a state + that cannot arise in AWS, so a new `BrokenMPU` error is returned, + indicating that retrying the request is unlikely to succeed. + + * Fixed several issues with the prefix, marker, and delimiter + parameters that would be mirrored back to clients when listing + buckets. 
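+
+    A hedged configuration sketch for the `ratelimit_as_client_error`
+    option mentioned at the top of this S3 API list; the section layout is
+    illustrative and follows proxy-server.conf-sample:
+
+        [filter:s3api]
+        use = egg:swift#s3api
+        # default (false) keeps the AWS-documented 503; set true for
+        # clients/SDKs that retry with backoff on 429
+        ratelimit_as_client_error = true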
+ + * Partition power increase improvements: + + * The relinker now spawns multiple subprocesses to process disks + in parallel. By default, one worker is spawned per disk; use the + new `--workers` option to control how many subprocesses are used. + Use `--workers=0` to maintain the previous behavior. + + * The relinker now performs eventlet-hub selection the same way as + other daemons. In particular, `epolls` will no longer be selected, + as it seemed to cause occasional hangs. + + * The relinker can now target specific storage policies or + partitions by using the new `--policy` and `--partition` + options. + + * Partitions that encountered errors during relinking are no longer + marked as completed in the relinker state file. This ensures that + a subsequent relink will retry the failed partitions. + + * Partition cleanup is more robust, decreasing the likelihood of + leaving behind mostly-empty partitions from the old partition + power. + + * Improved relinker progress logging, and started collecting + progress information for swift-recon. + + * Cleanup is more robust to files and directories being deleted by + another process. + + * The relinker better handles data found from earlier partition power + increases. + + * The relinker better handles tombstones found for the same object + but with different inodes. + + * The reconciler now defers working on policies that have a partition + power increase in progress to avoid issues with concurrent writes. + + * Erasure coding fixes: + + * Added the ability to quarantine EC fragments that have no (or few) + other fragments in the cluster. A new configuration option, + `quarantine_threshold`, in the reconstructor controls the point at + which the fragment will be quarantined; the default (0) will never + quarantine. Only fragments older than `quarantine_age` (default: + `reclaim_age`) may be quarantined. Before quarantining, the + reconstructor will attempt to fetch fragments from handoff nodes + in addition to the usual primary nodes; a new `request_node_count` + option (default `2 * replicas`) limits the total number of nodes to + contact. + + * Added a delay before deleting non-durable data. A new configuration + option, `commit_window` in the `[DEFAULT]` section of + object-server.conf, adjusts this delay; the default is 60 seconds. This + improves the durability of both back-dated PUTs (from the reconciler or + container-sync, for example) and fresh writes to handoffs by preventing + the reconstructor from deleting data that the object-server was still + writing. + + * Improved proxy-server and object-reconstructor logging when data + cannot be reconstructed. + + * Fixed an issue where some but not all fragments having metadata + applied could prevent reconstruction of missing fragments. + + * Server-side copying of erasure-coded data to a replicated policy no + longer copies EC sysmeta. The previous behavior had no material + effect, but could confuse operators examining data on disk. + + * Python 3 fixes: + + * Fixed a server error when performing a PUT authorized via + tempurl with some proxy pipelines. + + * Fixed a server error during GET of a symlink with some proxy + pipelines. + + * Fixed an issue with logging setup when /dev/log doesn't exist + or is not a UNIX socket. + + * The container-reconciler now scales out better with new `processes`, + `process`, and `concurrency` options, similar to the object-expirer. + + * The dark-data audit watcher now skips objects younger than a new + configurable `grace_age` period.
This avoids issues where data + could be flagged, quarantined, or deleted because of listing + consistency issues. The default is one week. + + * The dark-data audit watcher now requires that all primary locations + for an object's container agree that the data does not appear in + listings to consider data "dark". Previously, a network partition + that left an object node isolated could cause it to quarantine or + delete all of its data. + + * More daemons now support systemd notify sockets. + + * `EPIPE` errors no longer log tracebacks. + + * The account and container auditors now log and update recon before + going to sleep. + + * The object-expirer logs fewer client disconnects. + + * `swift-recon-cron` now includes the last time it was run in the recon + information. + + * `EIO` errors during read now cause object diskfiles to be quarantined. + + * The formpost middleware now properly supports uploading multiple files + with different content-types. + + * Various other minor bug fixes and improvements. + + +swift (2.27.0, OpenStack Wallaby) + + * Added "audit watcher" hooks to allow operators to run arbitrary code + against every diskfile in a cluster. For more information, see + https://docs.openstack.org/swift/latest/development_watchers.html + + * Added support for system-scoped "reader" roles when authenticating using + Keystone. Operators may configure this using the `system_reader_roles` + option in the `[filter:keystoneauth]` section of their proxy-server.conf. + + A comparable group, `.reseller_reader`, is now available for development + purposes when authenticating using tempauth. + + * Allow static large object segments to be deleted asynchronously. + Operators may opt into this new behavior by enabling the new + `allow_async_delete` option in the `[filter:slo]` section + in their proxy-server.conf. For more information, see + https://docs.openstack.org/swift/latest/overview_large_objects.html#deleting-a-large-object + + * Added the ability to connect to memcached over TLS. See the + `tls_*` options in etc/memcache.conf-sample + + * The proxy-server now caches 'listing' shards, improving listing + performance for sharded containers. A new config option, + `recheck_listing_shard_ranges`, controls the cache time and defaults to + 10 minutes; set it to 0 to disable caching (the previous behavior). + + * Added a new optional proxy-logging field `{wire_status_int}` for the + status code returned to the client. For more information, see + https://docs.openstack.org/swift/latest/logs.html#proxy-logs + + * Errors downloading a Static Large Object that cause a shorter-than-expected + response are now logged as 500s. + + * Memcache client error-limiting is now configurable. See the + `error_suppression_*` options in etc/memcache.conf-sample + + * Added `tasks_per_second` option to rate-limit the object-expirer. + + * Added `usedforsecurity` annotations for use on FIPS-compliant systems. + + * Added an option to write EC fragments with legacy CRC to ensure a smooth + upgrade from liberasurecode<=1.5.0 to >=1.6.2. For more information, see + https://bugs.launchpad.net/liberasurecode/+bug/1886088 + + * **Known Issue**: Operators should verify that encryption is not enabled + in their reconciler pipelines; having it enabled there may harm data + durability. For more information, see https://launchpad.net/bugs/1910804 + + * S3 API improvements: + + * Fixed a bug that prevented the s3api pipeline validation described in + proxy-server.conf-sample from being performed. 
As documented, operators + can disable this via the `auth_pipeline_check` option if proxy startup + fails with validation errors. + + * Make allowable clock skew configurable, with a default value of + 15 minutes to match AWS. Note that this was previously hardcoded at + 5 minutes; operators may want to preserve the prior behavior by setting + `allowable_clock_skew = 300` in the `[filter:s3api]` section of their + proxy-server.conf. + + * Fixed an issue where SHA mismatches in client XML payloads would cause + a server error. Swift now correctly responds with a client error about + the bad digest. + + * Fixed an issue where non-base64 signatures would cause a server error. + Swift now correctly responds with a client error about the invalid + digest. + + * Container ACLs are now cloned to the `+segments` container when it is + created. + + * The correct storage policy is now logged for S3 requests. + + * Added the ability to configure auth region in s3token middleware. + + * CORS-related headers are now passed through appropriately when using + the S3 API. Note that allowed origins and other container metadata + must still be configured through the Swift API as documented at + https://docs.openstack.org/swift/latest/cors.html + + Preflight requests do not contain enough information to map a + bucket to an account/container pair; a new cluster-wide option + `cors_preflight_allow_origin` may be configured for such OPTIONS + requests. The default (blank) rejects all S3 preflight requests. + + * Sharding improvements: + + * Prevent shard databases from losing track of their root database when + deleted. + + * Prevent sharded root databases from being reclaimed to ensure that + shards can detect that they have been deleted. + + * A `--no-auto-shard` option has been added to `swift-container-sharder`. + + * The sharder daemon has been enhanced to better support the shrinking + of shards that are no longer required. Shard containers will now + discover from their root container if they should be shrinking. They + will also discover the shards into which they should shrink, which may + include the root container itself. + + * A 'compact' command has been added to `swift-manage-shard-ranges` that + enables sequences of contiguous shards with low object counts to be + compacted into another existing shard, or into the root container. + + * `swift-manage-shard-ranges` can now accept a config file; this + may be used to ensure consistency of threshold values with the + container-sharder config. + + * Overlapping shrinking shards no longer generate audit warnings; these + are expected to sometimes overlap. + + * The sharding progress reports in recon cache now continue to be included + for a period of time after sharding has completed. The time period + may be configured using the `recon_sharded_timeout` option in the + `[container-sharder]` section of container-server.conf, and defaults + to 12 hours. + + * Add root containers with compactible ranges to recon cache. + + * Expose sharding statistics in the backend recon middleware. + + * Replication improvements: + + * Fixed a race condition in ssync that could lead to a loss of data + durability (or even loss of data, for two-replica policies) when some + object servers have outdated rings. Replication via rsync is likely + still affected by a similar bug. + + * Non-durable fragments can now be reverted from handoffs. + + * The post-rsync REPLICATE call no longer recalculates hashes immediately. 
+ + * Hashes are no longer invalidated after a successful ssync; they were + already invalidated during the data transfer. + + * Reduced log noise for common ssync errors. + + * Python 3 fixes: + + * Added support for Python 3.9. + + * Staticweb correctly handles listings when paths include non-ASCII + characters. + + * S3 API now allows multipart uploads with non-ASCII characters in the + object name. + + * Fixed an import-ordering issue in `swift-dispersion-populate`. + + * Partition power increase improvements: + + * Fixed a bug where stale state files would cause misplaced data during + multiple partition power increases. + + * Removed a race condition that could cause newly-written data to not be + linked into the new partition for the new partition power. + + * Improved safety during cleanup to ensure files have been relinked + appropriately before unlinking. + + * Added an option to drop privileges when running the relinker as root. + + * Added an option to rate-limit how quickly data files are relinked or + cleaned up. This may be used to reduce I/O load during partition power + increases, improving end-user performance. + + * Rehash partitions during the partition power increase. Previously, we + relied on the replication engine to perform the rehash, which could + cause an unexpected I/O spike after a partition power increase. + + * Warn when relinking/cleaning up and any disks are unmounted. + + * Log progress per partition when relinking/cleaning up. + + * During clean-up, stop warning about tombstones that got reaped from + the new location but not the old. + + * Added the ability to read options from object-server.conf, similar to + background daemons. + + * Turned off thread-logging when monkey-patching with eventlet. This + addresses a potential hang in the proxy-server while logging client + disconnects. + + * Fixed a bug that could cause EC GET responses to return a server error. + + * Fixed an issue with `swift-drive-audit` when run around New Year's. + + * Server errors encountered when validating the first segment of a Static or + Dynamic Large Object now return a 503 to the client, rather than a 409. + + * Errors when setting keys in memcached are now logged. This helps + operators detect when shard ranges for caching have gotten too large to + be stored, for example. + + * Various other minor bug fixes and improvements. + + +swift (2.26.0, OpenStack Victoria) + + * Extend concurrent reads to erasure coded policies. Previously, the + options `concurrent_gets` and `concurrency_timeout` only applied to + replicated policies. + + * Add a new `concurrent_ec_extra_requests` option to allow the proxy to + make some extra backend requests immediately. The proxy will respond as + soon as there are enough responses available to reconstruct. + + * The concurrent read options (`concurrent_gets`, `concurrency_timeout`, + and `concurrent_ec_extra_requests`) may now be configured per + storage-policy. + + * Replication servers can now handle all request methods. This allows + ssync to work with a separate replication network. + + * All background daemons now use the replication network. This allows + better isolation between external, client-facing traffic and internal, + background traffic. Note that during a rolling upgrade, replication + servers may respond with `405 Method Not Allowed`. To avoid this, + operators should remove the config option `replication_server = true` + from their replication servers; this will allow them to handle all + request methods before upgrading. 
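+
+    A hedged sketch of the concurrent-read options described at the start
+    of this release's notes; the values are illustrative only, and
+    per-policy overrides follow the syntax shown in proxy-server.conf-sample:
+
+        [app:proxy-server]
+        use = egg:swift#proxy
+        concurrent_gets = true
+        concurrency_timeout = 0.5
+        concurrent_ec_extra_requests = 1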
+ + * S3 API improvements: + + * Fixed some SignatureDoesNotMatch errors when using the AWS .NET SDK. + + * Add basic read support for object tagging. This improves + compatibility with AWS CLI version 2. Write support is not + yet implemented, so the tag set will always be empty. + + * CompleteMultipartUpload requests may now be safely retried. + + * Improved quota-exceeded error messages. + + * Improved logging and statsd metrics. Be aware that this will cause + an increase in the proxy-logging statsd metrics emitted for S3 + responses. However, this should more accurately reflect the state + of the system. + + * S3 requests are now less demanding on the container layer. + + * Python 3 bug fixes: + + * Fixed an error when reading encrypted data that was written while + running Python 2 for a path that includes non-ASCII characters. This + was caused by a difference in string types that resulted in + ambiguity when decrypting. To prevent the ambiguity for new data, set + `meta_version_to_write = 3` in your keymaster configuration after + upgrading all proxy servers. + + If upgrading from Swift 2.20.0 or Swift 2.19.1 or earlier, set + `meta_version_to_write = 1` in your keymaster configuration prior + to upgrading. + + * Object expiration respects the `expiring_objects_container_divisor` + config option. + + * `fallocate_reserve` may be specified as a percentage in more places. + + * The ETag-quoting middleware no longer raises TypeErrors. + + * Sharding improvements: + + * Prevent object updates from auto-creating shard containers. This + ensures more consistent listings for sharded containers during + rebalances. + + * Deleted shard containers are no longer considered root containers. + This prevents unnecessary sharding audit failures and allows the + deleted shard database to actually be unlinked. + + * `swift-container-info` now summarizes shard range information. + Pass `-v`/`--verbose` if you want to see all of them. + + * Improved container-sharder stat reporting to reduce load on root + container databases. + + * Don't inject shard ranges when user quits. + + * Servers now open one listen socket per worker, ensuring each worker + serves roughly the same number of concurrent connections. + + * Server workers may now be gracefully terminated via `SIGHUP` or + `SIGUSR1`. The parent process will then spawn a fresh worker. + + * During rebalances, clients should no longer get 404s for data that + exists but whose replicas are overloaded. + + * Improved cache management for account and container responses. + + * Allow proxy-logging middlewares to be configured more independently. + + * Allow operators to pass either raw or URL-quoted paths to + swift-get-nodes. Notably, this allows swift-get-nodes to work with + the reserved namespace used for object versioning. + + * Container read ACLs now work with object versioning. This only + allows access to the most-recent version via an unversioned URL. + + * Improved how containers reclaim deleted rows to reduce locking and object + update throughput. + + * Large object reads log fewer client disconnects. + + * Allow ratelimit to be placed multiple times in a proxy pipeline, + such as both before s3api and auth (to handle swift requests without + needing to make an auth decision) and after (to limit S3 requests). + + * Shuffle object-updater work. This somewhat reduces the impact a + single overloaded database has on other containers' listings.
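+
+    An illustrative (and deliberately simplified) pipeline showing the
+    ratelimit placement noted above, both before s3api/auth and after; a
+    real pipeline will carry more middleware, as in proxy-server.conf-sample:
+
+        [pipeline:main]
+        pipeline = catch_errors proxy-logging cache ratelimit s3api s3token keystoneauth ratelimit proxy-logging proxy-server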
+ + * Fix a proxy-server error when retrieving erasure coded data when + there are durable fragments but not enough to reconstruct. + + * Fix an error in the proxy server when finalizing data. + + * Improve performance when increasing partition power. + + * Various other minor bug fixes and improvements. + + +swift (2.25.1, ussuri stable backports) + + * Python 3 bug fixes: + + * Fixed an error when reading encrypted data that was written while + running Python 2 for a path that includes non-ASCII characters. This + was caused by a difference in string types that resulted in + ambiguity when decrypting. To prevent the ambiguity for new data, set + `meta_version_to_write = 3` in your keymaster configuration after + upgrading all proxy servers. + + If upgrading from Swift 2.20.0 or Swift 2.19.1 or earlier, set + `meta_version_to_write = 1` in your keymaster configuration prior + to upgrading. + + * Object expiration respects the `expiring_objects_container_divisor` + config option. + + * `fallocate_reserve` may be specified as a percentage in more places. + + * The ETag-quoting middleware no longer raises TypeErrors. + + * Improved how containers reclaim deleted rows to reduce locking and object + update throughput. + + * Fix a proxy-server error when retrieving erasure coded data when + there are durable fragments but not enough to reconstruct. + + * Fixed some SignatureDoesNotMatch errors when using the AWS .NET SDK. + + * Region name config option is now respected when configuring S3 credential + caching. + + +swift (2.25.0, OpenStack Ussuri) + + * WSGI server processes can now notify systemd when they are ready. + + * Added `ttfb` (Time to First Byte) and `pid` (Process ID) to the set + of available proxy-server log fields. For more information, see + https://docs.openstack.org/swift/latest/logs.html + + * Improved proxy-server performance by reducing unnecessary locking, + memory copies, and eventlet scheduling. + + * Reduced object-replicator and object-reconstructor CPU usage by only + checking that the device list is current when rings change. + + * Improved performance of sharded container listings when performing + prefix listings. + + * Improved container-sync performance when data has already been + deleted or overwritten. + + * Account quotas are now enforced even on empty accounts. + + * Getting an SLO manifest with `?format=raw` now responds with an ETag + that matches the MD5 of the generated body rather than the MD5 of + the manifest stored on disk. + + * Provide useful status codes in logs for some versioning and symlink + subrequests that were previously logged as 499. + + * Fixed 500 from cname_lookup middleware. Previously, if the looked-up + domain was used by domain_remap to update the request path, the + server would respond Internal Error. + + * On Python 3, fixed an issue when reading or writing objects with a + content-type like `message/*`. Previously, Swift would fail to respond. + + * On Python 3, fixed a RecursionError in swift-dispersion-report when + using TLS. + + * Fixed a bug in the new object versioning API that would cause more + than `limit` results to be returned when listing. + + * Various other minor bug fixes and improvements. + + +swift (2.24.0) + + * Added a new object versioning mode, with APIs for querying and + accessing old versions. 
For more information, see the documentation + at https://docs.openstack.org/swift/latest/middleware.html#module-swift.common.middleware.versioned_writes.object_versioning + + * Added support for S3 versioning using the above new mode. + + * Added a new middleware to allow accounts and containers to opt-in to + RFC-compliant ETags. This may be useful when using Swift as an origin + for some content delivery networks. For more information, see the + documentation at https://docs.openstack.org/swift/latest/middleware.html#module-swift.common.middleware.etag_quoter + Clients should be aware of the fact that ETags may be quoted for RFC + compliance; this may become the default behavior in some future release. + + * Proxy, account, container, and object servers now support "seamless + reloads" via `SIGUSR1`. This is similar to the existing graceful + restarts but keeps the server socket open the whole time, reducing + service downtime. + + * New buckets created via the S3 API will now store multi-part upload + data in the same storage policy as other data rather than the + cluster's default storage policy. + + * Device region and zone can now be changed via `swift-ring-builder`. + Note that this may cause a lot of data movement on the next rebalance + as the builder tries to reach full dispersion. + + * Added support for Python 3.8. + + * The container sharder can now handle containers with special + characters in their names. + + * Internal client no longer logs object DELETEs as status 499. + + * Objects with an `X-Delete-At` value in the far future no longer cause + backend server errors. + + * The bulk extract middleware once again allows clients to specify metadata + (including expiration timestamps) for all objects in the archive. + + * Container sync now synchronizes static symlinks in a way similar to + static large objects. + + * `swift_source` is set for more sub-requests in the proxy-server. See + https://docs.openstack.org/swift/latest/logs.html#swift-source + + * Errors encountered while validating static symlink targets no longer + cause BadResponseLength errors in the proxy-server. + + * On Python 3, the KMS keymaster now works with secrets stored + in Barbican with a text/plain payload-content-type. + + * On Python 3, the formpost middleware now works with unicode file names. + + * Several utility scripts now work better on Python 3: + + * swift-account-audit + + * swift-dispersion-populate + + * swift-drive-recon + + * swift-recon + + * On Python 3, certain S3 API headers are now lower case as they + would be coming from AWS. + + * Per-service `auto_create_account_prefix` settings are now deprecated + and may be ignored in a future release; if you need to use this, please + set it in the `[swift-constraints]` section of /etc/swift/swift.conf. + + * Various other minor bug fixes and improvements. + + +swift (2.23.3, train stable backports) + + * Sharding improvements: + + * Prevent object updates from auto-creating shard containers. This + ensures more consistent listings for sharded containers during + rebalances. + + * Deleted shard containers are no longer considered root containers. + This prevents unnecessary sharding audit failures and allows the + deleted shard database to actually be unlinked. + + * The sharder daemon has been enhanced to better support the shrinking + of shards that are no longer required. Shard containers will now + discover from their root container if they should be shrinking. 
They + will also discover the shards into which they should shrink, which may + include the root container itself. + + * Improved performance of sharded container listings when performing + prefix listings. + + * Improved container-sharder stat reporting to reduce load on root + container databases. + + * The container sharder can now handle containers with special + characters in their names. + + * `swift-container-info` now summarizes shard range information. + Pass `-v`/`--verbose` if you want to see all of them. + + * Don't inject shard ranges when user quits. + + * Various other minor bug fixes and improvements. + + * Python 3 bug fixes: + + * Fixed a potential server error when uploading data via a tempurl. + + * Fixed a potential server error when getting symlink details. + + * Added the ability to connect to memcached over TLS. See the + `tls_*` options in etc/memcache.conf-sample + + +swift (2.23.2, train stable backports) + + * Python 3 bug fixes: + + * Fixed an error when reading encrypted data that was written while + running Python 2 for a path that includes non-ASCII characters. This + was caused by a difference in string types that resulted in + ambiguity when decrypting. To prevent the ambiguity for new data, set + `meta_version_to_write = 3` in your keymaster configuration after + upgrading all proxy servers. + + If upgrading from Swift 2.20.0 or Swift 2.19.1 or earlier, set + `meta_version_to_write = 1` in your keymaster configuration prior + to upgrading. + + * Fixed an issue when reading or writing objects with a content-type + like `message/*`. Previously, Swift would fail to respond. + + * Object expiration respects the `expiring_objects_container_divisor` + config option. + + * `fallocate_reserve` may be specified as a percentage in more places. + + * The formpost middleware now works with unicode file names. + + * Certain S3 API headers are now lower case as they would be coming + from AWS. + + * Improved how containers reclaim deleted rows to reduce locking and object + update throughput. + + * Fix a proxy-server error when retrieving erasure coded data when + there are durable fragments but not enough to reconstruct. + + * Fixed 500 from cname_lookup middleware. Previously, if the looked-up + domain was used by domain_remap to update the request path, the + server would respond Internal Error. + + * The bulk extract middleware once again allows clients to specify metadata + (including expiration timestamps) for all objects in the archive. + + * Errors encountered while validating static symlink targets no longer + cause BadResponseLength errors in the proxy-server. + + * Fixed some SignatureDoesNotMatch errors when using the AWS .NET SDK. + + * Various other minor bug fixes and improvements. + + +swift (2.23.1, train stable backports) + + * On Python 3, the KMS keymaster now works with secrets stored + in Barbican with a text/plain payload-content-type. + + * Several utility scripts now work better on Python 3: + + * swift-account-audit + + * swift-dispersion-populate + + * swift-drive-recon + + * swift-recon + + +swift (2.23.0, OpenStack Train) + + * Python 3.6 and 3.7 are now fully supported. Several py3-related + fixes are included: + + * Removed a request-smuggling vector when running a mixed + py2/py3 cluster. + + * Allow fallocate_reserve to be specified as a percentage. + + * Fixed listings for sharded containers. + + * Fixed non-ASCII account metadata handling. + + * Fixed rsync output parsing. + + * Fixed some title-casing of headers. 
+ + If you've been testing Swift on Python 3, upgrade at your earliest + convenience. + + * Added "static symlinks", which perform some validation as they + follow redirects and include more information about their target + in container listings. + + * Multi-character strings may now be used as delimiters in account + and container listings. + + * Sharding improvements + + * Container metadata related to sharding are now removed when no + longer needed. + + * Empty container databases (such as might be created on handoffs) + now shard much more quickly. + + * The proxy-server now ignores 404 responses from handoffs that have + no data when deciding on the correct response for object requests, + similar to what it already does for account and container requests. + + * Static Large Object sizes in listings for versioned containers are + now more accurate. + + * When refetching Static Large Object manifests, non-manifest responses + are now handled better. + + * S3 API now translates 503 Service Unavailable responses to a more + S3-like response instead of raising an error. + + * Improved proxy-to-backend requests to be more RFC-compliant. + + * Dependency update: eventlet must be at least 0.25.0. This also + dragged forward minimum-supported versions of dnspython (1.15.0), + greenlet (0.3.2), and six (1.10.0). + + * Various other minor bug fixes and improvements. + + +swift (2.22.0) + + * Experimental support for Python 3.6 and 3.7 is now available. + Note that this requires eventlet>=0.25.0. All unit tests pass, + and running functional tests under Python 2 will pass against + services running under Python 3. Expect full support in the + next minor release. + + * Log formats are now more configurable and include support for + anonymization. See the log_msg_template option in proxy-server.conf + and https://docs.openstack.org/swift/latest/logs.html#proxy-logs + for more information. + + * Added an operator tool, swift-container-deleter, to asynchronously + delete some or all objects in a container using the object expirers. + + * Swift-all-in-one Docker images are now built and published to + https://hub.docker.com/r/openstackswift/saio. These are intended + for use as development targets, but will hopefully be useful as a + starting point for other work involving containerizing Swift. + + * The object-expirer may now be configured in object-server.conf. + This is in anticipation of a future change to allow the + object-expirer to be deployed on all nodes that run object-servers. + + * Correctness improvements + + * The proxy-server now ignores 404 responses from handoffs without + databases when deciding on the correct response for account and + container requests. + + * Object writes to a container whose existence cannot be verified + now 503 instead of 404. + + * Sharding improvements + + * The container-replicator now only attempts to fetch shard ranges if + the remote indicates that it has shard ranges. Further, it does so + with a timeout to prevent the process from hanging in certain cases. + + * The proxy-server now caches 'updating' shards, improving write + performance for sharded containers. A new config option, + `recheck_updating_shard_ranges`, controls the cache time; set it to + 0 to disable caching. + + * The container-replicator now correctly enqueues container-reconciler + work for sharded containers. + + * S3 API improvements + + * Unsigned payloads work with v4 signatures once more. + + * Multipart upload parts may now be copied from other multipart uploads. 
+ + * CompleteMultipartUpload requests with a Content-MD5 now work. + + * Content-Type can now be updated when copying an object. + + * Fixed v1 listings that end with a non-ASCII object name. + + * Background corruption-detection improvements + + * Detect and remove invalid entries from hashes.pkl + + * When object path is not a directory, just quarantine it, + rather than the whole suffix. + + * Dependency updates: we've increased our minimum supported version + of cryptography to 2.0.2 and netifaces to 0.8. This is largely due + to the difficulty of continuing to test with the old versions. + + If running Swift under Python 3, eventlet must be at least 0.25.0. + + * Various other minor bug fixes and improvements. + + +swift (2.21.1, stein stable backports) + + * Sharding improvements + + * The container-replicator now only attempts to fetch shard ranges if + the remote indicates that it has shard ranges. Further, it does so + with a timeout to prevent the process from hanging in certain cases. + + * The container-replicator now correctly enqueues container-reconciler + work for sharded containers. + + * Container metadata related to sharding are now removed when no + longer needed. + + * S3 API improvements + + * Unsigned payloads work with v4 signatures once more. + + * Multipart upload parts may now be copied from other multipart uploads. + + * CompleteMultipartUpload requests with a Content-MD5 now work. + + * Content-Type can now be updated when copying an object. + + * Fixed v1 listings that end with a non-ASCII object name. + + * Background corruption-detection improvements + + * Detect and remove invalid entries from hashes.pkl + + * When object path is not a directory, just quarantine it, + rather than the whole suffix. + + * Static Large Object sizes in listings for versioned containers are + now more accurate. + + * When refetching Static Large Object manifests, non-manifest responses + are now handled better. + + * Cross-account symlinks now store correct account information in + container listings. This was previously fixed in 2.22.0. + + * Requesting multiple ranges from a Dynamic Large Object now returns the + entire object instead of incorrect data. This was previously fixed in + 2.23.0. + + * When making backend requests, the proxy-server now ensures query + parameters are always properly quoted. Previously, the proxy would + encounter an error on Python 2.7.17 if the client included non-ASCII + query parameters in object requests. This was previously fixed in + 2.23.0. + + +swift (2.21.0, OpenStack Stein) + + * Change the behavior of the EC reconstructor to perform a + fragment rebuild to a handoff node when a primary peer responds + with 507 to the REPLICATE request. This changes EC to match the + existing behavior of replication when drives fail. After a + rebalance of EC rings (potentially removing unmounted/failed + devices), it's most IO efficient to run in handoffs_only mode to + avoid unnecessary rebuilds. + + * O_TMPFILE support is now detected by attempting to use it + instead of looking at the kernel version. This allows older + kernels with backported patches to take advantage of the + O_TMPFILE functionality. + + * Add slo_manifest_hook callback to allow other middlewares to + impose additional constraints on or make edits to SLO manifests + before being written. For example, a middleware could enforce + minimum segment size or insert data segments. 
+ + * Fixed an issue with multi-region EC policies that caused the EC + reconstructor to constantly attempt cross-region rebuild + traffic. + + * Fixed an issue where S3 API v4 signatures would not be validated + against the body of the request, allowing a replay attack if + request headers were captured by a malicious third party. + + * Display crypto data/metadata details in swift-object-info. + + * formpost can now accept a content-encoding parameter. + + * Fixed an issue where multipart uploads with the S3 API would + sometimes report an error despite all segments being uploaded + successfully. + + * Multipart object segments are now actually deleted when the + multipart object is deleted via the S3 API. + + * Swift now returns a 503 (instead of a 500) when an account + auto-create fails. + + * Fixed a bug where encryption would store the incorrect key + metadata if the object name starts with a slash. + + * Fixed an issue where an object server failure during a client + download could leave an open socket between the proxy and + client. + + * Fixed an issue where deleted EC objects didn't have their + on-disk directories cleaned up. This would cause extra resource + usage on the object servers. + + * Fixed an issue where bulk requests using XML and Expect: + 100-continue would return a malformed HTTP response. + + * Various other minor bug fixes and improvements. + + +swift (2.20.0) + + * S3 API compatibility updates + + * Swift can now cache the S3 secret from Keystone to use for + subsequent requests. This functionality is disabled by default but + can be enabled by setting the `secret_cache_duration` in the s3token + section of the proxy server config to a number greater than 0 (a + minimal sketch appears further down this list). + + * s3api now mimics the AWS S3 behavior of periodically sending + whitespace characters on a Complete Multipart Upload request to keep + the connection from timing out. Note that since a request could fail + after the initial 200 OK response has been sent, it is important to + check the response body to determine if the request succeeded. + + * s3api now properly handles x-amz-metadata-directive headers on + COPY operations. + + * s3api now uses concurrency (default 2) to handle multi-delete + requests. This allows multi-delete requests to be processed much + more quickly. + + * s3api now mimics some forms of AWS server-side encryption + based on whether Swift's at-rest encryption functionality is enabled. + Note that S3 API users are now able to know more about how the + cluster is configured than they were previously, i.e. whether + at-rest encryption functionality is enabled or not. + + * s3api responses now include a '-' in multipart ETags. + + For new multipart uploads via the S3 API, the ETag that is + stored will be calculated in the same way that AWS uses. This + ETag will be used in GET/HEAD responses, bucket listings, and + conditional requests via the S3 API. Accessing the same object + via the Swift API will use the SLO Etag; however, in JSON + container listings the multipart upload etag will be exposed + in a new "s3_etag" key. Previously, some S3 clients would complain + about download corruption when the ETag did not have a '-'. + + * S3 ETags for SLOs now include a '-'. + + Ordinary objects in S3 use the MD5 of the object as the ETag, + just like Swift. Multipart Uploads follow a different format, notably + including a dash followed by the number of segments. To that end + (and for S3 API requests *only*), SLO responses via the S3 API have a + literal '-N' added on the end of the ETag.
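    A minimal, hedged sketch of the S3 secret caching described at the top of this list. The section name and entry point follow the sample proxy config; the duration shown is arbitrary, and the s3token filter still needs its usual Keystone/auth settings alongside it:

        [filter:s3token]
        use = egg:swift#s3token
        # cache Keystone-provided S3 secrets for ten minutes; 0 disables caching
        secret_cache_duration = 600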
+ + * The default location is now set to "us-east-1". This is more likely + to be the default region that a client will try when using v4 + signatures. + + Deployers with clusters that relied on the old implicit default + location of "US" should explicitly set `location = US` in the + `[filter:s3api]` section of proxy-server.conf before upgrading. + + * Add basic support for ?versions bucket listings. We still do not + have support for toggling S3 bucket versioning, but we can at least + support getting the latest versions of all objects. + + * Fixed an issue with SSYNC requests to ensure that only one request + can be running on a partition at a time. + + * Data encryption updates + + * The kmip_keymaster middleware can now be configured directly in the + proxy-server config file. The existing behavior of using an external + config file is still supported. + + * Multiple keymaster middlewares are now supported. This allows + migration from one key provider to another. + + Note that secret_id values must remain unique across all keymasters + in a given pipeline. If they are not unique, the right-most keymaster + will take precedence. + + When looking for the active root secret, only the right-most + keymaster is used. + + * Prevent PyKMIP's kmip_protocol logger from logging at DEBUG. + Previously, some versions of PyKMIP would include all wire + data when the root logger was configured to log at DEBUG; this + could expose key material in logs. Only the kmip_keymaster was + affected. + + * Fixed an issue where a failed drive could prevent the container sharder + from making progress. + + * Storage policy definitions in swift.conf can now define the diskfile + to use to access objects. See the included swift.conf-sample file for + a description of usage. + + * The EC reconstructor will now attempt to remove empty directories + immediately, while the inodes are still cached, rather than waiting + until the next run. + + * Added a keep_idle config option to configure KEEPIDLE time for TCP + sockets. The default value is the old constant of 600. + + * Add databases_per_second to the account-replicator, + container-replicator, and container-sharder. This prevents them from + using a full CPU core when they are not IO limited. + + * Allow direct_client users to overwrite the X-Timestamp header. + + * Various other minor bug fixes and improvements. + + +swift (2.19.2, rocky stable backports) + + * Sharding improvements + + * The container-replicator now only attempts to fetch shard ranges if + the remote indicates that it has shard ranges. Further, it does so + with a timeout to prevent the process from hanging in certain cases. + + * The container-replicator now correctly enqueues container-reconciler + work for sharded containers. + + * S3 API improvements + + * Fixed an issue where v4 signatures would not be validated against + the body of the request, allowing a replay attack if request headers + were captured by a malicious third party. Note that unsigned payloads + still function normally. + + * CompleteMultipartUpload requests with a Content-MD5 now work. + + * Fixed v1 listings that end with a non-ASCII object name. + + * Multipart object segments are now actually deleted when the + multipart object is deleted via the S3 API. + + * Fixed an issue that caused Delete Multiple Objects requests with + large bodies to 400. This was previously fixed in 2.20.0. + + * Fixed an issue where non-ASCII Keystone EC2 credentials would not get + mapped to the correct account. 
This was previously fixed in 2.20.0. + + * Background corruption-detection improvements + + * Detect and remove invalid entries from hashes.pkl + + * When object path is not a directory, just quarantine it, + rather than the whole suffix. + + + * Fixed a bug where encryption would store the incorrect key + metadata if the object name starts with a slash. + + * Fixed an issue where an object server failure during a client + download could leave an open socket between the proxy and + client. + + * Static Large Object sizes in listings for versioned containers are + now more accurate. + + * When refetching Static Large Object manifests, non-manifest responses + are now handled better. + + * Cross-account symlinks now store correct account information in + container listings. This was previously fixed in 2.22.0. + + * Requesting multiple ranges from a Dynamic Large Object now returns the + entire object instead of incorrect data. This was previously fixed in + 2.23.0. + + * When making backend requests, the proxy-server now ensures query + parameters are always properly quoted. Previously, the proxy would + encounter an error on Python 2.7.17 if the client included non-ASCII + query parameters in object requests. This was previously fixed in + 2.23.0. + + +swift (2.19.1, rocky stable backports) + + * Prevent PyKMIP's kmip_protocol logger from logging at DEBUG. + Previously, some versions of PyKMIP would include all wire + data when the root logger was configured to log at DEBUG; this + could expose key material in logs. Only the kmip_keymaster was + affected. + + * Fixed an issue where a failed drive could prevent the container sharder + from making progress. + + * Fixed a bug in how Swift uses eventlet that was exposed under high + concurrency. + + +swift (2.19.0, OpenStack Rocky) + + * TempURLs now support IP range restrictions. Please see + https://docs.openstack.org/swift/latest/middleware.html#client-usage + for more information on how to use this additional restriction. + + * Add support for multiple root encryption secrets for the trivial + and KMIP keymasters. This allows operators to rotate encryption + keys over time without needing to re-encrypt all existing data + in the cluster. Please see the included sample config files for + instructions on how to configure multiple encryption keys. + + * The object updater now supports two configuration settings: + "concurrency" and "updater_workers". The latter controls how many + worker processes are spawned, while the former controls how many + concurrent container updates are performed by each worker + process. This should speed the processing of async_pendings. + + On upgrade, a node configured with concurrency=N will still handle + async updates N-at-a-time, but will do so using only one process + instead of N. + + If you have a config file like this: + + [object-updater] + concurrency = <N> + + and you want to take advantage of faster updates, then do this: + + [object-updater] + concurrency = 8 # the default; you can omit this line + updater_workers = <N> + + If you want updates to be processed exactly as before, do this: + + [object-updater] + concurrency = 1 + updater_workers = <N> + + * When listing objects in a container in json format, static large + objects (SLOs) will now include an additional new "slo_etag" key + that matches the etag returned when requesting the SLO. The + existing "hash" key remains unchanged as the MD5 of the SLO + manifest. Text and XML listings are unaffected by this change. + + * Log deprecation warnings for `run_pause`.
This setting was + deprecated in Swift 2.4.0 and is replaced by `interval`. + It may be removed in a future release. + + * Object reconstructor logs are now prefixed with information + about the specific worker process logging the message. This + makes reading the logs and understanding the messages much simpler. + + * Lower bounds of dependencies have been updated to reflect what + is actually tested. + + * SSYNC replication mode now removes as much of the directory + structure as possible as soon as it observes that the directory + is empty. This reduces the work needed for subsequent replication + passes. + + * The container-updater now reports zero objects and bytes used for + child DBs in sharded containers. This prevents double-counting in + utilization reports. + + * Add fallocate_reserve to account and container servers. This + allows disks shared between account/container and object rings to + avoid getting 100% full. The default value of 1% matches the + existing default on object servers. + + * Added an experimental `swift-ring-composer` CLI tool to build + composite rings. + + * Added an optional `read_only` middleware to make an entire cluster + or individual accounts read only. + + * Fixed a bug where zero-byte PUTs would not work properly + with "If-None-Match: *" conditional requests. + + * ACLs now work with unicode in user/account names. + + * COPY now works with unicode account names. + + * Improved S3 API compatibility. + + * Lock timeouts in the container updater are now logged at INFO + level, not ERROR. + + * Various other minor bug fixes and improvements. + + +swift (2.18.0) + + * Added container sharding, an operator-controlled feature that + may be used to shard very large container databases into a + number of smaller shard containers. This mitigates the issues + with one large DB by distributing the data across multiple + smaller databases throughout the cluster. Please read the full + overview at + https://docs.openstack.org/swift/latest/overview_container_sharding.html + + * Provide an S3 API compatibility layer. The external "swift3" + project has been imported into Swift's codebase as the "s3api" + middleware. + + * Added "emergency mode" hooks in the account and container replicators. + These options may be used to prioritize moving handoff + partitions to primary locations more quickly. This helps when + adding capacity to a ring. + + - Added `-d <devices>` and `-p <partitions>` command line options. + + - Added a handoffs-only mode. + + * Add a multiprocess mode to the object replicator. Setting the + "replicator_workers" setting to a positive value N will result + in the replicator using up to N worker processes to perform + replication tasks. At most one worker per disk will be spawned. + + Worker process logs will have a bit of information prepended so + operators can tell which messages came from which worker. The + prefix is "[worker M/N pid=P] ", where M is the worker's index, + N is the total number of workers, and P is the process ID. Every + message from the replicator's logger will have the prefix. + + * The object reconstructor will now fork all available worker + processes when operating on a subset of local devices. + + * Add support for PROXY protocol v1 to the proxy server. This + allows the Swift proxy server to log accurate client IP + addresses when there is a proxy or SSL-terminator between the + client and the Swift proxy server. Example servers supporting + this PROXY protocol include stunnel, haproxy, hitch, and + varnish.
See the sample proxy server config file for the + appropriate config setting to enable or disable this + functionality. + + * In the ratelimit middleware, account whitelist and blacklist + settings have been deprecated and may be removed in a future + release. When found, a deprecation message will be logged. + Instead of these config file values, set + X-Account-Sysmeta-Global-Write-Ratelimit:WHITELIST and + X-Account-Sysmeta-Global-Write-Ratelimit:BLACKLIST on the particular accounts that need + to be whitelisted or blacklisted. System metadata cannot be added + or modified by standard clients. Use the internal client to set sysmeta. + + * Add a --drop-prefixes flag to swift-account-info, + swift-container-info, and swift-object-info. This makes the + output between the three more consistent. + + * statsd error messages correspond to 5xx responses only. This + makes monitoring more useful because actual errors (5xx) will + not be hidden by common user requests (4xx). Previously, some 4xx + responses would be included in timing information in the statsd + error messages. + + * Truncate error logs to prevent the log handler from running out of buffer space. + + * Updated requirements.txt to match global exclusions and formatting. + + * tempauth user names now support unicode characters. + + * Various other minor bug fixes and improvements. + + +swift (2.17.1, queens stable backports) + + * Fix SLO delete for accounts with non-ASCII names. + + * Fixed an issue in COPY where concurrent requests may have copied the + wrong data. + + * Fixed a bug in how Swift uses eventlet that was exposed under high + concurrency. + + +swift (2.17.0, OpenStack Queens) + + * Added symlink objects support. + + Symlink objects reference one other object. They are created by + creating an empty object with an X-Symlink-Target header. The value of + the header is of the format <container>/<object>, and the target does + not need to exist at the time of symlink creation. Cross-account + symlinks can be created by including the + X-Symlink-Target-Account header. + + GET and HEAD requests to a symlink will operate on the + referenced object and require appropriate permission in the + target container. DELETE and PUT requests will operate on the + symlink object itself. POST requests are not forwarded to the + referenced object. POST requests sent to a symlink will result + in a 307 Temporary Redirect response. + + * Added support for inline data segments in SLO manifests. + + Upgrade impact: during a rolling upgrade, an updated proxy server + may write a manifest that an out-of-date proxy server will not be + able to read. This will resolve itself once the upgrade completes + on all nodes. + + * The tempurl digest algorithm is now configurable, and Swift added + support for both SHA-256 and SHA-512. Supported tempurl digests + are exposed to clients in `/info`. Additionally, tempurl signatures + can now be base64 encoded. + + * Object expiry improvements + + - Disallow X-Delete-At header values equal to the X-Timestamp header. + + - X-Delete-At computation now uses X-Timestamp instead of + system time. This prevents clock skew causing inconsistent + expiry data. + + - Deleting an expiring object will now cause less work in the system. + The number of async pending files written has been reduced for all + objects and greatly reduced for erasure-coded objects. This + dramatically reduces the burden on container servers. + + - Stopped logging tracebacks when receiving an unexpected response.
+ + - Allow the expirer to gracefully move past updating stale work items. + + * When the object auditor examines an object, it will now add any + missing metadata checksums. + + * `swift-ring-builder` improvements + + - Save the ring when dispersion improves, even if balance + doesn't improve. + + - Improved the granularity of the ring dispersion metric so that + small improvements after a rebalance can show changes in the + dispersion number. Dispersion in existing and new rings can be + recalculated using the new '--recalculate' option to + `swift-ring-builder`. + + - Display more info on empty rings. + + * Fixed rare socket leak on range requests to erasure-coded objects. + + * The number of container updates on object PUTs (ie to update listings) + has been recomputed to be far more efficient while maintaining + durability guarantees. Specifically, object PUTs to erasure-coded + policies will now normally result in far fewer container updates. + + * Moved Zuul v3 tox jobs into the Swift code repo. + + * Changed where liberasurecode-devel for CentOS 7 is referenced and + installed as a dependency. + + * Added container/object listing with prefix to InternalClient. + + * Added '--swift-versions' to `swift-recon` CLI to compare installed + versions in the cluster. + + * Stop logging tracebacks in the `object-replicator` when it runs + out of handoff locations. + + * Send ETag header in 206 Partial Content responses to SLO reads. + + * Now `swift-recon-cron` works with conf.d configs. + + * Improved `object-updater` stats logging. It now tells you all of + its stats (successes, failures, quarantines due to bad pickles, + unlinks, and errors), and it tells you incremental progress every + five minutes. The logging at the end of a pass remains and has + been expanded to also include all stats. + + * If a proxy server is configured to autocreate accounts and the + account create fails, it will now return a server error (500) + instead of Not Found (404). + + * Fractional replicas are no longer allowed for erasure code policies. + + * Various other minor bug fixes and improvements. + + +swift (2.16.0) + + * Add checksum to object extended attributes. + + * Let clients request heartbeats during SLO PUTs by including + the query parameter `heartbeat=on`. + + With heartbeating turned on, the proxy will start its response + immediately with 202 Accepted then send a single whitespace + character periodically until the request completes. At that + point, a final summary chunk will be sent which includes a + "Response Status" key indicating success or failure and (if + successful) an "Etag" key indicating the Etag of the resulting + SLO. + + * Added support for retrieving the encryption root secret from an + external key management system. In practice, this is currently limited + to Barbican. + + * Move listing formatting out to a new proxy middleware named + `listing_formats`. `listing_formats` should be just right of the + first proxy-logging middleware, and left of most other + middlewares. If it is not already present, it will be + automatically inserted for you. + + Note: if you have a custom middleware that makes account or + container listings, it will only receive listings in JSON format. + + * Log deprecation warning for `allow_versions` in the container + server config. Configure the `versioned_writes` middleware in + the proxy server instead. This option will be ignored in a + future release. 
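    To make the migration in the preceding item concrete, a hedged sketch follows; the option names track the sample configs, and `versioned_writes` must also appear in the proxy's [pipeline:main] for this to take effect:

        # proxy-server.conf: configure versioning in the proxy instead
        [filter:versioned_writes]
        use = egg:swift#versioned_writes
        allow_versioned_writes = true

        # container-server.conf: the deprecated equivalent this replaces
        # allow_versions = true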
+ + * Replaced `replication_one_per_device` by custom count defined by + `replication_concurrency_per_device`. The original config value + is deprecated, but continues to function for now. If both values + are defined, the old `replication_one_per_device` is ignored. + + * Fixed a rare issue where multiple backend timeouts could result + in bad data being returned to the client. + + * Cleaned up logged tracebacks when talking to memcached servers. + + * Account and container replication stats logs now include + `remote_merges`, the number of times a whole database was sent + to another node. + + * Respond 400 Bad Request when Accept headers fail to parse + instead of returning 406 Not Acceptable. + + * The `domain_remap` middleware now supports the + `mangle_client_paths` option. Its default "false" value changes + `domain_remap` parsing to stop stripping the `path_root` value + from URL paths. If users depend on this path mangling, operators + should set `mangle_client_paths` to "True" before upgrading. + + * Remove `swift-temp-url` script. The functionality has been in + swiftclient for a long time and this script has been deprecated + since 2.10.0. + + * Removed all `post_as_copy` related code and configs. The option + has been deprecated since 2.13.0. + + * Fixed XML responses (eg on bulk extractions and SLO upload + failures) to be more correct. The enclosing "delete" tag was + removed where it doesn't make sense and replaced with "extract" + or "upload" depending on the context. + + * Static Large Object (SLO) manifest may now (again) have zero-byte + last segments. + + * Fixed an issue where background consistency daemon child + processes would deadlock waiting on the same file descriptor. + + * Removed a race condition where a POST to an SLO could modify the + X-Static-Large-Object metadata. + + * Accept a trade off of dispersion for balance in the ring builder + that will result in getting to balanced rings much more quickly + in some cases. + + * Fixed using `swift-ring-builder set_weight` with more than one + device. + + * When requesting objects, return 404 if a tombstone is found and + is newer than any data found. Previous behavior was to return + stale data. + + * Various other minor bug fixes and improvements. + + +swift (2.15.2, pike stable backports) + + * Fixed a cache invalidation issue related to GET and PUT requests to + containers that would occasionally cause object PUTs to a container to + 404 after the container had been successfully created. + + * Removed a race condition where a POST to an SLO could modify the + X-Static-Large-Object metadata. + + * Fixed rare socket leak on range requests to erasure-coded objects. + + * Fix SLO delete for accounts with non-ASCII names. + + * Fixed an issue in COPY where concurrent requests may have copied the + wrong data. + + * Fixed time skew when using X-Delete-After. + + * Send ETag header in 206 Partial Content responses to SLO reads. + + +swift (2.15.1, OpenStack Pike) + + * Fixed a bug introduced in 2.15.0 where the object reconstructor + would exit with a traceback if no EC policy was configured. + + * Fixed deadlock when logging from a tpool thread. + + The object server runs certain IO-intensive methods outside the + main pthread for performance. Previously, if one of those methods + tried to log, this can cause a crash that eventually leads to an + object server with hundreds or thousands of greenthreads, all + deadlocked. The fix is to use a mutex that works across different + greenlets and different pthreads. 
+ + * The object reconstructor can now rebuild an EC fragment for an + expired object. + + * Various other minor bug fixes and improvements. + + +swift (2.15.0) + + * Add Composite Ring Functionality + + A composite ring comprises two or more component rings that are + combined to form a single ring with a replica count equal to the + sum of the component rings. The component rings are built + independently, using distinct devices in distinct regions, which + means that the dispersion of replicas between the components can + be guaranteed. + + Composite rings can be used for explicit replica placement and + "replicated EC" for global erasure codes policies. + + Composite rings support 'cooperative' rebalance which means that + during rebalance all component rings will be consulted before a + partition is moved in any component ring. This avoids the same + partition being simultaneously moved in multiple components. + + We do not yet have CLI tools for creating composite rings, but + the functionality has been enabled in the ring modules to + support this advanced functionality. CLI tools will be delivered + in a subsequent release. + + For further information see the docs at + + + * The EC reconstructor process has been dramatically improved by + adding support for multiple concurrent workers. Multiple + processes are required to get high concurrency, and this change + results in much faster rebalance times on servers with many + drives. + + Currently the default is still only one process, and no workers. + Set `reconstructor_workers` in the `[object-reconstructor]` + section to some whole number <= the number of devices on a node + to get that many reconstructor workers. + + * Add support to increase object ring partition power transparently + to end users and with no cluster downtime. Increasing the ring + partition power allows for incremental adjustment to the upper bound + of the cluster size. Please review the full docs at + . + + * Added support for per-policy proxy config options. This allows + per-policy affinity options to be set for use with duplicated EC + policies and composite rings. Certain options found in per-policy + conf sections will override their equivalents that may be set + in the [app:proxy-server] section. Currently the options handled that + way are sorting_method, read_affinity, write_affinity, + write_affinity_node_count, and write_affinity_handoff_delete_count. + + * Enabled versioned writes on Dynamic Large Objects (DLOs). + + * Write-affinity aware object deletion + + Previously, when deleting objects in multi-region swift + deployment with write affinity configured, users always get 404 + when deleting object before it's replicated to appropriate nodes. + + Now Swift will use `write_affinity_handoff_delete_count` to + define how many local handoff nodes should swift send request to + get more candidates for the final response. The default value + "auto" means Swift will calculate the number automatically based + on the number of replicas and current cluster topology. + + * Require that known-bad EC schemes be deprecated + + Erasure-coded storage policies using isa_l_rs_vand and nparity + >= 5 must be configured as deprecated, preventing any new + containers from being created with such a policy. This + configuration is known to harm data durability. Any data in such + policies should be migrated to a new policy. 
See + https://bugs.launchpad.net/swift/+bug/1639691 for more + information. + + * Optimize the Erasure Code reconstructor protocol to reduce IO + load on servers. + + * Fixed a bug where SSYNC would fail to replicate unexpired objects. + + * Fixed a bug in domain_remap when the object name starts or ends with a slash. + + * Fixed a socket leak in copy middleware when a large object was copied. + + * Fixed a few areas where the `swiftdir` option was not respected. + + * `swift-recon` now respects storage policy aliases. + + * cname_lookup middleware now accepts a `nameservers` config + variable that, if defined, will be used for DNS lookups instead of + the system default. + + * Make mount_check option usable in containerized environments by + adding a check for an ".ismount" file at the root directory of + a device. + + * Remove deprecated `vm_test_mode` option. + + * The object and container server config option `slowdown` has been + deprecated in favor of the new `objects_per_second` and + `containers_per_second` options. + + * The output of devices from `swift-ring-builder` has been reordered + by region, zone, ip, and device. + + * Imported docs content from the openstack-manuals project. + + * Various other minor bug fixes and improvements. + + +swift (2.14.0) + + * Fixed an error where a container drive error resulted in double space + usage on the remaining drives. When a drive holding a container or account database + is unmounted, the bug would create handoff replicas on all remaining + drives, increasing the drive space used and filling the cluster. + + * Fixed a UnicodeDecodeError in the object reconstructor that would + prevent objects with non-ASCII names from being reconstructed and + caused the reconstructor process to hang. + + * EC Fragment Duplication - Foundational Global EC Cluster Support. + + * Fixed an encoding issue in ssync where a mix of ASCII and non-ASCII + metadata values would cause an error. + + * `name_check` and `cname_lookup` keys have been added to `/info`. + + * Add Vary: headers for CORS responses. + + * Always set Swift processes to use UTC. + + * Prevent logged traceback in object-server on client disconnect for + chunked transfers to replicated policies. + + * Removed per-device reconstruction stats. Now that the reconstructor + is shuffling parts before going through them, those stats no longer + make sense. + + * Log correct status code for conditional requests. + + * Drop support for auth-server from common/manager.py and `swift-init`. + + * Include received fragment index in reconstructor log warnings. + + * Fixed a race condition in updating hashes.pkl where a partition + suffix invalidation may have been skipped. + + * `domain_remap` now accepts a list of domains in "storage_domain". + + * Do not follow CNAME when host is in storage_domain. + + * Enable cluster-wide CORS Expose-Headers setting via + "cors_expose_headers". + + * Cache all answers from nameservers in cname_lookup. + + * Log the correct request type of a subrequest downstream of copy. + + * Various other minor bug fixes and improvements. + + +swift (2.13.0, OpenStack Ocata) + + * Improvements in key parts of the consistency engine + + - Improved performance by eliminating an unneeded directory + structure hash. + + - Optimized the common case for hashing filesystem trees, thus + eliminating a lot of extraneous disk I/O. + + - Updated the `hashes.pkl` file format to include timestamp information + for race detection. Also simplified hashing logic to prevent race + conditions and optimize for the common case.
+ + - The erasure code reconstructor will now shuffle work jobs across all + disks instead of going disk-by-disk. This eliminates single-disk I/O + contention and allows continued scaling as concurrency is increased. + + - Erasure code reconstruction handles moving data from handoff nodes + better. Instead of moving the data to another handoff, it waits + until it can be moved to a primary node. + + Upgrade Impact: If you upgrade and roll back, you must delete all + `hashes.pkl` files. + + * If using erasure coding with ISA-L in rs_vand mode and 5 or more parity + fragments, Swift will emit a warning. This is a configuration that is + known to harm data durability. In a future release, this warning will be + upgraded to an error unless the policy is marked as deprecated. All data + in an erasure code storage policy using isa_l_rs_vand with 5 or more + parity should be migrated as soon as possible. Please see + https://bugs.launchpad.net/swift/+bug/1639691 for more information. + + * The erasure code reconstructor `handoffs_first` option has been + deprecated in favor of `handoffs_only`. `handoffs_only` is far more + useful, and just like `handoffs_first` mode in the replicator, it gives + the operator the option of forcing the consistency engine to focus + solely on revert (handoff) jobs, thus improving the speed of + rebalances. The `handoffs_only` behavior is somewhat consistent with + the replicator's `handoffs_first` option (any error on any handoff in + the replicator will make it essentially handoff only forever) but the + `handoff_only` option does what you want and is named correctly in the + reconstructor. + + * The default for `object_post_as_copy` has been changed to False. The + option is now deprecated and will be removed in a future release. If + your cluster is still running with post-as-copy enabled, please update + it to use the "fast-post" method. Future versions of Swift will not + support post-as-copy, and future features will not be supported under + post-as-copy. ("Fast-post" is where `object_post_as_copy` is false). + + * Temporary URLs now support one common form of ISO 8601 timestamps in + addition to Unix seconds-since-epoch timestamps. The ISO 8601 format + accepted is '%Y-%m-%dT%H:%M:%SZ'. This makes TempURLs more + user-friendly to produce and consume. + + * Listing containers in accounts with json or xml now includes a + `last_modified` time. This does not change any on-disk data, but simply + exposes the value to offer consistency with the object listings on + containers. + + * Fixed a bug where the ring builder would not allow removal of a device + when min_part_seconds_left was greater than zero. + + * PUT subrequests generated from a client-side COPY will now properly log + the SSC (server-side copy) Swift source field. See + https://docs.openstack.org/swift/latest/logs.html#swift-source for + more information. + + * Fixed a bug where an SLO download with a range request may have resulted + in a 5xx series response. + + * SLO manifest PUT requests can now be properly validated by sending an + ETag header of the md5 sum of the concatenated md5 sums of the + referenced segments. + + * Fixed the stats calculation in the erasure code reconstructor. + + * Rings with min_part_hours set to zero will now only move one partition + replica per rebalance, thus matching behavior when min_part_hours is + greater than zero. + + * I/O priority is now supported on AArch64 architecture. + + * Various other minor bug fixes and improvements. 
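    For the `handoffs_only` reconstructor mode described in the 2.13.0 notes above, a minimal sketch of a temporary, rebalance-focused configuration (assuming the usual [object-reconstructor] section of object-server.conf):

        [object-reconstructor]
        # focus solely on revert (handoff) jobs during a rebalance;
        # switch back to false once handoffs have drained
        handoffs_only = true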
+ + +swift (2.12.0) + + * Ring files now include byteorder information about the endian of + the machine used to generate the file, and the values are + appropriately byteswapped if deserialized on a machine with a + different endianness. + + Newly created ring files will be byteorder agnostic, but + previously generated ring files will still fail on different + endian architectures. Regenerating older ring files will cause + them to become byteorder agnostic. The regeneration of the ring + files will not cause any new data movement. Newer ring files + will still be usable by older versions of Swift (on machines + with the same endianness--this maintains existing behavior). + + * All 416 responses will now include a Content-Range header with + an unsatisfied-range value. This allows the caller to know the + valid range request value for an object. + + * TempURLs now support a validation against a common prefix. A + prefix-based signature grants access to all objects which share the + same prefix. This avoids the creation of a large amount of signatures, + when a whole container or pseudofolder is shared. + + * Correctly handle deleted files with if-none-match requests. + + * Correctly send 412 Precondition Failed if a user sends an + invalid copy destination. Previously Swift would send a 500 + Internal Server Error. + + * In SLO manifests, the `etag` and `size_bytes` keys are now fully + optional and not required. Previously, the keys needed to exist + but the values were optional. The only required key is `path`. + + * Fixed a rare infinite loop in `swift-ring-builder` while placing parts. + + * Ensure update of the container by object-updater, removing a rare + possibility that objects would never be added to a container listing. + + * Fixed non-deterministic suffix updates in hashes.pkl where a partition + may be updated much less often than expected. + + * Fixed regression in consolidate_hashes that occurred when a new + file was stored to new suffix to a non-empty partition. This bug + was introduced in 2.7.0 and could cause an increase in rsync + replication stats during and after upgrade, due to inconsistent + hashing of partition suffixes. + + * Account and container databases will now be quarantined if the + database schema has been corrupted. + + * Removed "in-process-" from func env tox name to work with + upstream CI. + + * Respect server type for --md5 check in swift-recon. + + * Remove empty db hash and suffix directories if a db gets quarantined. + + * Various other minor bug fixes and improvements. + + +swift (2.11.0) + + * We have made significant improvements and changes to the erasure + code implementation. + + - Instead of using a separate .durable file to indicate the + durable status of an EC fragment archive, we rename the .data + to include a durable marker in the filename. This saves one + inode for every EC .data file. Existing .durable files will not + be removed, and they will continue to work just fine. + + Note that after writing EC data with Swift 2.11.0 or later, that + data will not be accessible to earlier versions of Swift. + + - Closed a bug where ssync may have written bad fragment data in + some circumstances. A check was added to ensure the correct number + of bytes is written for a fragment before finalizing the write. + Also, erasure coded fragment metadata will now be validated on read + requests and, if bad data is found, the fragment will be quarantined. 
+ + - The improvements to EC reads made in Swift 2.10.0 have also been + applied to the reconstructor. This allows fragments to be rebuilt + in more circumstances, resulting in faster recovery from failures. + + - WARNING: If you are using the ISA-L library for erasure codes, + please upgrade to liberasurecode 1.3.1 (or later) as soon as + possible. If you are using isa_l_rs_vand with more than 4 parity, + please read https://bugs.launchpad.net/swift/+bug/1639691 and take + necessary action. + + - Updated the PyECLib dependency to 1.3.1. + + * Added a configurable URL base to staticweb. + + * Support multi-range GETs for static large objects. + + * TempURLs using the "inline" parameter can now also set the + "filename" parameter. Both are used in the Content-Disposition + response header. + + * Mirror X-Trans-Id to X-Openstack-Request-Id. + + * SLO will now concurrently HEAD segments, resulting in much faster + manifest validation and object creation. By default, two HEAD requests + will be done at a time, but this can be changed by the operator via + the new `concurrency` setting in the "[filter:slo]" section of + the proxy server config. + + * Suppressed the KeyError message when auditor finds an expired object. + + * Daemons using InternalClient can now be properly killed with SIGTERM. + + * Added a "user" option to the drive-audit config file. Its value is + used to set the owner of the drive-audit recon cache. + + * Throttle update_auditor_status calls so it updates no more than once + per minute. + + * Suppress unexpected-file warnings for rsync temp files. + + * Various other minor bug fixes and improvements. + + +swift (2.10.0, OpenStack Newton) + + * Object versioning now supports a "history" mode in addition to + the older "stack" mode. The difference is in how DELETE requests + are handled. For full details, please read + https://docs.openstack.org/swift/latest/overview_object_versioning.html. + + * New config variables to change the schedule priority and I/O + scheduling class. Servers and daemons now understand + `nice_priority`, `ionice_class`, and `ionice_priority` to + schedule their relative importance. Please read + https://docs.openstack.org/swift/latest/admin_guide.html + for full config details. + + * On newer kernels (3.15+ when using xfs), Swift will use the O_TMPFILE + flag when opening a file instead of creating a temporary file + and renaming it on commit. This makes the data path simpler and + allows the filesystem to more efficiently optimize the files on + disk, resulting in better performance. + + * Erasure code GET performance has been significantly + improved in clusters that are not completely healthy. + + * Significant improvements to the api-ref doc available at + https://docs.openstack.org/api-ref/object-store/. + + * A PUT or POST to a container will now update the container's + Last-Modified time, and that value will be included in a + GET/HEAD response. + + * Include object sysmeta in POST responses. Sysmeta is still + stripped from the response before being sent to the client, but + this allows middleware to make use of the information. + + * Fixed a bug where a container listing delimiter wouldn't work + with encryption. + + * Fixed a bug where some headers weren't being copied correctly + in a COPY request. + + * Container sync can now copy SLOs more efficiently by allowing + the manifest to be synced before all of the referenced segments. + This fixes a bug where container sync would not copy SLO manifests. 
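    Returning to the scheduling options introduced earlier in this 2.10.0 section, a hedged illustration of what such a stanza might look like; the daemon section and values are purely illustrative, and the admin guide remains the authority on valid classes and ranges:

        [object-auditor]
        nice_priority = 10
        ionice_class = IOPRIO_CLASS_IDLE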
+ + * Fixed a bug where some tombstone files might never be reclaimed. + + * Update dnspython dependency to 1.14, removing the need to have + separate dnspython dependencies for Py2 and Py3. + + * Deprecate swift-temp-url and call python-swiftclient's + implementation instead. This adds python-swiftclient as an + optional dependency of Swift. + + * Moved other-requirements.txt to bindep.txt. bindep.txt lists + non-python dependencies of Swift. + + * Various other minor bug fixes and improvements. + + +swift (2.9.0) + + * Swift now supports at-rest encryption. This feature encrypts all + object data and user-set object metadata as it is sent to the cluster. + This feature is designed to prevent information leaks if a hard drive + leaves the cluster. The encryption is transparent to the end-user. + + At-rest encryption in Swift is enabled on the proxy server by + adding two middlewares to the pipeline. The `keymaster` middleware + is responsible for managing the encryption keys and the `encryption` + middleware does the actual encryption and decryption. + + Existing clusters will continue to work without enabling + encryption. Although enabling this feature on existing clusters + is supported, best practice is to enable this feature on new + clusters when the cluster is created. + + For more information on the details of the at-rest encryption + feature, please see the docs at + https://docs.openstack.org/swift/latest/overview_encryption.html. + + * `swift-recon` can now be called with more than one server type. + + * Fixed a bug where non-ascii names could cause an error in logging + and cause a 5xx response to the client. + + * The install guide and API reference have been moved into Swift's + source code repository. + + * Various other minor bug fixes and improvements. + + +swift (2.8.0) + + * Allow concurrent bulk deletes for server-side deletes of static + large objects. Previously this would be single-threaded and each + DELETE executed serially. The new `delete_concurrency` value + (default value is 2) in the `[filter:slo]` and `[filter:bulk]` + sections of the proxy server config controls the concurrency + used to perform the DELETE requests for referenced segments. The + default value is recommended, but setting the value to 1 + restores previous behavior. + + * Refactor server-side copy as middleware + + The COPY verb is now implemented in the `copy` middleware instead + of in the proxy server code. If not explicitly added, the server + side copy middleware is auto-inserted to the left of `dlo`, `slo` + and `versioned_writes` middlewares in the proxy server pipeline. + As a result, dlo and slo `copy_hooks` are no longer required. SLO + manifests are now validated when copied so when copying a + manifest to another account the referenced segments must be + readable in that account for the manifest copy to succeed + (previously this validation was not made, meaning the manifest + was copied but could be unusable if the segments were not + readable). + + With this change, there should be no change in functionality or + existing behavior. + + * `fallocate_reserve` can now be a percentage (a value ending in "%"), + and the default has been adjusted to "1%". + + * Now properly require account/container metadata be valid UTF-8 + + * TempURL responses now include an `Expires` header with the + expiration time embedded in the URL. + + * Non-Python dependencies are now listed in other-requirements.txt. 
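    As a hedged sketch of the `delete_concurrency` option described at the start of this 2.8.0 section (the value shown is the documented default, and both filters accept the same option):

        [filter:slo]
        use = egg:swift#slo
        delete_concurrency = 2

        [filter:bulk]
        use = egg:swift#bulk
        delete_concurrency = 2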
+ + * `swift-ring-builder` now supports a `--yes` option to assume a + yes response to all questions. This is useful for scripts. + + * Write requests to a replicated storage policy with an even number + of replicas now have a quorum size of half the replica count + instead of half-plus-one. + + * Container sync now logs per-container stat information so operators + can track progress. This is logged at INFO level. + + * `swift-dispersion-*` now allows region to be specified when there + are multiple Swift regions served by the same Keystone instance + + * Fix infinite recursion during logging when syslog is down. + + * Fixed a bug where a backend failure during a read could result in + a missing byte in the response body. + + * Stop `staticweb` revealing container existence to unauth'd requests. + + * Reclaim isolated .meta files if they are older than the `reclaim_age`. + + * Make `rsync` ignore its own temporary files instead of spreading + them around the cluster, wasting space. + + * The object auditor now ignores files in the devices directory when + auditing objects. + + * The deprecated `threads_per_disk` setting has been removed. Deployers + are encouraged to use `servers_per_port` instead. + + * Fixed an issue where a single-replica configuration for account or + container DBs could result in the DB being inadvertently deleted if + it was placed on a handoff node. + + * `disable_fallocate` now also correctly disables `fallocate_reserve`. + + * Fixed a bug where the account-reaper did not delete all containers + in a reaped account. + + * Correctly handle delimiter queries where results start with the + delimiter and no prefix is given. + + * Changed the recommended ports for Swift services from ports + 6000-6002 to unused ports 6200-6202 so they do not conflict with + X-Windows or other services. Since these config values must be + explicitly set in the config file, this doesn't impact existing + deployments. + + * Fixed an instance where REPLICATE requests would not use + `replication_ip`. + + * Various other minor bug fixes and improvements. + + +swift (2.7.0, OpenStack Mitaka) + + * Bump PyECLib requirement to >= 1.2.0 + + * Update container on fast-POST + + "Fast-POST" is the mode where `object_post_as_copy` is set to + `False` in the proxy server config. This mode now allows for + fast, efficient updates of metadata without needing to fully + recopy the contents of the object. While the default still is + `object_post_as_copy` as True, the plan is to change the default + to False and then deprecate post-as-copy functionality in later + releases. Fast-POST now supports container-sync functionality. + + * Add concurrent reads option to proxy. + + This change adds 2 new parameters to enable and control concurrent + GETs in Swift, these are `concurrent_gets` and `concurrency_timeout`. + + `concurrent_gets` allows you to turn on or off concurrent + GETs; when on, it will set the GET/HEAD concurrency to the + replica count. And in the case of EC HEADs it will set it to + ndata. The proxy will then serve only the first valid source to + respond. This applies to all account, container, and replicated + object GETs and HEADs. For EC only HEAD requests are affected. + The default for `concurrent_gets` is off. + + `concurrency_timeout` is related to `concurrent_gets` and is + the amount of time to wait before firing the next thread. 
A + value of 0 will fire at the same time (fully concurrent), but + setting another value will stagger the firing allowing you the + ability to give a node a short chance to respond before firing + the next. This value is a float and should be somewhere between + 0 and `node_timeout`. The default is `conn_timeout`, meaning by + default it will stagger the firing. + + * Added an operational procedures guide to the docs. It can be + found at https://docs.openstack.org/swift/latest/ops_runbook/index.html and + includes information on detecting and handling day-to-day + operational issues in a Swift cluster. + + * Make `handoffs_first` a more useful mode for the object replicator. + + The `handoffs_first` replication mode is used during periods of + problematic cluster behavior (e.g. full disks) when replication + needs to quickly drain partitions from a handoff node and move + them to a primary node. + + Previously, `handoffs_first` would sort that handoff work before + "normal" replication jobs, but the normal replication work could + take quite some time and result in handoffs not being drained + quickly enough. + + In order to focus on getting handoff partitions off the node + `handoffs_first` mode will now abort the current replication + sweep before attempting any primary suffix syncing if any of the + handoff partitions were not removed for any reason - and start + over with replication of handoffs jobs as the highest priority. + + Note that `handoffs_first` being enabled will emit a warning on + start up, even if no handoff jobs fail, because of the negative + impact it can have during normal operations by dog-piling on a + node that was temporarily unavailable. + + * By default, inbound `X-Timestamp` headers are now disallowed + (except when in an authorized container-sync request). This + header is useful for allowing data migration from other storage + systems to Swift and keeping the original timestamp of the data. + If you have this migration use case (or any other requirement on + allowing the clients to set an object's timestamp), set the + `shunt_inbound_x_timestamp` config variable to False in the + gatekeeper middleware config section of the proxy server config. + + * Requesting a SLO manifest file with the query parameters + "?multipart-manifest=get&format=raw" will return the contents of + the manifest in the format as was originally sent by the client. + The "format=raw" is new. + + * Static web page listings can now be rendered with a custom + label. By default listings are rendered with a label of: + "Listing of /v1///". This change adds + a new custom metadata key/value pair + `X-Container-Meta-Web-Listings-Label: My Label` that when set, + will cause the following: "Listing of My Label/" to be + rendered instead. + + * Previously, static large objects (SLOs) had a minimum segment + size (default to 1MiB). This limit has been removed, but small + segments will be ratelimited. The config parameter + `rate_limit_under_size` controls the definition of "small" + segments (1MiB by default), and `rate_limit_segments_per_sec` + controls how many segments per second can be served (default is 1). + With the default values, the effective behavior is identical to the + previous behavior when serving SLOs. + + * Container sync has been improved to perform a HEAD on the remote + side of the sync for each object being synced. 
If the object + exists on the remote side, container-sync will no longer + transfer the object, thus significantly lowering the network + requirements to use the feature. + + * The object auditor will now clean up any old, stale rsync temp + files that it finds. These rsync temp files are left if the + rsync process fails without completing a full transfer of an + object. Since these files can be large, the temp files may end + up filling a disk. The new auditor functionality will reap these + rsync temp files if they are old. The new object-auditor config + variable `rsync_tempfile_timeout` is the number of seconds old a + tempfile must be before it is reaped. By default, this variable + is set to "auto" or the rsync_timeout plus 900 seconds (falling + back to a value of 1 day). + + * The Erasure Code reconstruction process has been made more + efficient by not syncing data files when only the durable commit + file is missing. + + * Fixed a bug where 304 and 416 response may not have the right + Etag and Accept-Ranges headers when the object is stored in an + Erasure Coded policy. + + * Versioned writes now correctly stores the date of previous versions + using GMT instead of local time. + + * The deprecated Keystone middleware option is_admin has been removed. + + * Fixed log format in object auditor. + + * The zero-byte mode (ZBF) of the object auditor will now properly + observe the `--once` option. + + * Swift keeps track, internally, of "dirty" parts of the partition + keyspace with a "hashes.pkl" file. Operations on this file no + longer require a read-modify-write cycle and use a new + "hashes.invalid" file to track dirty partitions. This change + will improve end-user performance for PUT and DELETE operations. + + * The object replicator's succeeded and failed counts are now logged. + + * `swift-recon` can now query hosts by storage policy. + + * The log_statsd_host value can now be an IPv6 address or a hostname + which only resolves to an IPv6 address. + + * Erasure coded fragments now properly call fallocate to reserve disk + space before being written. + + * Various other minor bug fixes and improvements. + + +swift (2.6.0) + + * Dependency changes + - Updated minimum version of eventlet to 0.17.4 to support IPv6. + + - Updated the minimum version of PyECLib to 1.0.7. + + * The ring rebalancing algorithm was updated to better handle edge cases + and to give better (more balanced) rings in the general case. New rings + will have better initial placement, capacity adjustments will move less + data for better balance, and existing rings that were imbalanced should + start to become better balanced as they go through rebalance cycles. + + * Added container and account reverse listings. + + A GET request to an account or container resource with a "reverse=true" + query parameter will return the listing in reverse order. When + iterating over pages of reverse listings, the relative order of marker + and end_marker are swapped. + + * Storage policies now support having more than one name. + + This allows operators to fix a typo without breaking existing clients, + or, alternatively, have "short names" for policies. This is implemented + with the "aliases" config key in the storage policy config in + swift.conf. The aliases value is a list of names that the storage + policy may also be identified by. The storage policy "name" is used to + report the policy to users (eg in container headers). The aliases have + the same naming restrictions as the policy's primary name. 
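+
+    As an illustration of the "aliases" key described above (the policy
+    name and alias values here are made up for the example), an aliased
+    policy in swift.conf might look like:
+
+        [storage-policy:1]
+        name = silver
+        aliases = canada, ca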
+ + * The object auditor learned the "interval" config value to control the + time between each audit pass. + + * `swift-recon --all` now includes the config checksum check. + + * `swift-init` learned the --kill-after-timeout option to force a service + to quit (SIGKILL) after a designated time. + + * `swift-recon` now correctly shows timestamps in UTC instead of local + time. + + * Fixed bug where `swift-ring-builder` couldn't select device id 0. + + * Documented the previously undocumented + `swift-ring-builder pretend_min_part_hours_passed` command. + + * The "node_timeout" config value now accepts decimal values. + + * `swift-ring-builder` now properly removes devices with zero weight. + + * `swift-init` return codes are updated via "--strict" and "--non-strict" + options. Please see the usage string for more information. + + * `swift-ring-builder` now reports the min_part_hours lockout time + remaining + + * Container sync has been improved to more quickly find and iterate over + the containers to be synced. This reduced server load and lowers the + time required to see data propagate between two clusters. Please see + https://docs.openstack.org/swift/latest/overview_container_sync.html for more details + about the new on-disk structure for tracking synchronized containers. + + * A container POST will now update that container's put-timestamp value. + + * TempURL header restrictions are now exposed in /info. + + * Error messages on static large object manifest responses have been + greatly improved. + + * Closed a bug where an unfinished read of a large object would leak a + socket file descriptor and a small amount of memory. (CVE-2016-0738) + + * Fixed an issue where a zero-byte object PUT with an incorrect Etag + would return a 503. + + * Fixed an error when a static large object manifest references the same + object more than once. + + * Improved performance of finding handoff nodes if a zone is empty. + + * Fixed duplication of headers in Access-Control-Expose-Headers on CORS + requests. + + * Fixed handling of IPv6 connections to memcache pools. + + * Continued work towards python 3 compatibility. + + * Various other minor bug fixes and improvements. + + +swift (2.5.0, OpenStack Liberty) + + * Added the ability to specify ranges for Static Large Object (SLO) + segments. + + * Replicator configs now support an "rsync_module" value to allow + for per-device rsync modules. This setting gives operators the + ability to fine-tune replication traffic in a Swift cluster and + isolate replication disk IO to a particular device. Please see + the docs and sample config files for more information and + examples. + + * Significant work has gone in to testing, fixing, and validating + Swift's erasure code support at different scales. + + * Swift now emits StatsD metrics on a per-policy basis. + + * Fixed an issue with Keystone integration where a COPY request to a + service account may have succeeded even if a service token was not + included in the request. + + * Ring validation now warns if a placement partition gets assigned to the + same device multiple times. This happens when devices in the ring are + unbalanced (e.g. two servers where one server has significantly more + available capacity). + + * Various other minor bug fixes and improvements. + + +swift (2.4.0) + + * Dependency changes + + - Added six requirement. This is part of an ongoing effort to add + support for Python 3. + + - Dropped support for Python 2.6. 
+ + * Config changes + + - Recent versions of Python restrict the number of headers allowed in a + request to 100. This number may be too low for custom middleware. The + new "extra_header_count" config value in swift.conf can be used to + increase the number of headers allowed. + + - Renamed "run_pause" setting to "interval" (current configs with + run_pause still work). Future versions of Swift may remove the + run_pause setting. + + * Versioned writes middleware + + The versioned writes feature has been refactored and reimplemented as + middleware. You should explicitly add the versioned_writes middleware to + your proxy pipeline, but do not remove or disable the existing container + server config setting ("allow_versions"), if it is currently enabled. + The existing container server config setting enables existing + containers to continue being versioned. Please see + https://docs.openstack.org/swift/latest/middleware.html#how-to-enable-object-versioning-in-a-swift-cluster + for further upgrade notes. + + * Allow 1+ object-servers-per-disk deployment + + Enabled by a new > 0 integer config value, "servers_per_port" in the + [DEFAULT] config section for object-server and/or replication server + configs. The setting's integer value determines how many different + object-server workers handle requests for any single unique local port + in the ring. In this mode, the parent swift-object-server process + continues to run as the original user (i.e. root if low-port binding + is required), binds to all ports as defined in the ring, and forks off + the specified number of workers per listen socket. The child, per-port + servers drop privileges and behave pretty much how object-server workers + always have, except that because the ring has unique ports per disk, the + object-servers will only be handling requests for a single disk. The + parent process detects dead servers and restarts them (with the correct + listen socket), starts missing servers when an updated ring file is + found with a device on the server with a new port, and kills extraneous + servers when their port is found to no longer be in the ring. The ring + files are stat'ed at most every "ring_check_interval" seconds, as + configured in the object-server config (same default of 15s). + + In testing, this deployment configuration (with a value of 3) lowers + request latency, improves requests per second, and isolates slow disk + IO as compared to the existing "workers" setting. To use this, each + device must be added to the ring using a different port. + + * Do container listing updates in another (green)thread + + The object server has learned the "container_update_timeout" setting + (with a default of 1 second). This value is the number of seconds that + the object server will wait for the container server to update the + listing before returning the status of the object PUT operation. + + Previously, the object server would wait up to 3 seconds for the + container server response. The new behavior dramatically lowers object + PUT latency when container servers in the cluster are busy (e.g. when + the container is very large). Setting the value too low may result in a + client PUT'ing an object and not being able to immediately find it in + listings. Setting it too high will increase latency for clients when + container servers are busy. + + * TempURL fixes (closes CVE-2015-5223) + + Do not allow PUT tempurls to create pointers to other data. + Specifically, disallow the creation of DLO object manifests via a PUT + tempurl. 
This prevents discoverability attacks which can use any PUT + tempurl to probe for private data by creating a DLO object manifest and + then using the PUT tempurl to head the object. + + * Ring changes + + - Partition placement no longer uses the port number to place + partitions. This improves dispersion in small clusters running one + object server per drive, and it does not affect dispersion in + clusters running one object server per server. + + - Added ring-builder-analyzer tool to more easily test and analyze a + series of ring management operations. + + - Stop moving partitions unnecessarily when overload is on. + + * Significant improvements and bug fixes have been made to erasure code + support. This feature is suitable for beta testing, but it is not yet + ready for broad production usage. + + * Bulk upload now treats user xattrs on files in the given archive as + object metadata on the resulting created objects. + + * Emit warning log in object replicator if "handoffs_first" or + "handoff_delete" is set. + + * Enable object replicator's failure count in swift-recon. + + * Added storage policy support to dispersion tools. + + * Support keystone v3 domains in swift-dispersion. + + * Added domain_remap information to the /info endpoint. + + * Added support for a "default_reseller_prefix" in domain_remap + middleware config. + + * Allow SLO PUTs to forgo per-segment integrity checks. Previously, each + segment referenced in the manifest also needed the correct etag and + bytes setting. These fields now allow the "null" value to skip those + particular checks on the given segment. + + * Allow rsync to use compression via a "rsync_compress" config. If set to + true, compression is only enabled for an rsync to a device in a + different region. In some cases, this can speed up cross-region + replication data transfer. + + * Added time synchronization check in swift-recon (the --time option). + + * The account reaper now runs faster on large accounts. + + * Various other minor bug fixes and improvements. + + +swift (2.3.0, OpenStack Kilo) + + * Erasure Code support (beta) + + Swift now supports an erasure-code (EC) storage policy type. This allows + deployers to achieve very high durability with less raw capacity as used + in replicated storage. However, EC requires more CPU and network + resources, so it is not good for every use case. EC is great for storing + large, infrequently accessed data in a single region. + + Swift's implementation of erasure codes is meant to be transparent to + end users. There is no API difference between replicated storage and + EC storage. + + To support erasure codes, Swift now depends on PyECLib and + liberasurecode. liberasurecode is a pluggable library that allows for + the actual EC algorithm to be implemented in a library of your choosing. + + As a beta release, EC support is nearly fully feature complete, but it + is lacking support for some features (like multi-range reads) and has + not had a full performance characterization. This feature relies on + ssync for durability. Deployers are urged to do extensive testing and + not deploy production data using an erasure code storage policy. + + Full docs are at https://docs.openstack.org/swift/latest/overview_erasure_code.html + + * Add support for container TempURL Keys. + + * Make more memcache options configurable. connection_timeout, + pool_timeout, tries, and io_timeout are all now configurable. + + * Swift now supports composite tokens. 
This allows another service to + act on behalf of a user, but only with that user's consent. + See https://docs.openstack.org/swift/latest/overview_auth.html for more details. + + * Multi-region replication was improved. When replicating data to a + different region, only one replica will be pushed per replication + cycle. This gives the remote region a chance to replicate the data + locally instead of pushing more data over the inter-region network. + + * Internal requests from the ratelimit middleware now properly log a + swift_source. See https://docs.openstack.org/swift/latest/logs.html for details. + + * Improved storage policy support for quarantine stats in swift-recon. + + * The proxy log line now includes the request's storage policy index. + + * Ring checker has been added to swift-recon to validate if rings are + built correctly. As part of this feature, storage servers have learned + the OPTIONS verb. + + * Add support of x-remove- headers for container-sync. + + * Rings now support hostnames instead of just IP addresses. + + * Swift now enforces that the API version on a request is valid. Valid + versions are configured via the valid_api_versions setting in swift.conf + + * Various other minor bug fixes and improvements. + + +swift (2.2.2) + + * Data placement changes + + This release has several major changes to data placement in Swift in + order to better handle different deployment patterns. First, with an + unbalance-able ring, less partitions will move if the movement doesn't + result in any better dispersion across failure domains. Also, empty + (partition weight of zero) devices will no longer keep partitions after + rebalancing when there is an unbalance-able ring. + + Second, the notion of "overload" has been added to Swift's rings. This + allows devices to take some extra partitions (more than would normally + be allowed by the device weight) so that smaller and unbalanced clusters + will have less data movement between servers, zones, or regions if there + is a failure in the cluster. + + Finally, rings have a new metric called "dispersion". This is the + percentage of partitions in the ring that have too many replicas in a + particular failure domain. For example, if you have three servers in a + cluster but two replicas for a partition get placed onto the same + server, that partition will count towards the dispersion metric. A + lower value is better, and the value can be used to find the proper + value for "overload". + + The overload and dispersion metrics have been exposed in the + swift-ring-build CLI tools. + + See https://docs.openstack.org/swift/latest/overview_ring.html + for more info on how data placement works now. + + * Improve replication of large out-of-sync, out-of-date containers. + + * Added console logging to swift-drive-audit with a new log_to_console + config option (default False). + + * Optimize replication when a device and/or partition is specified. + + * Fix dynamic large object manifests getting versioned. This was not + intended and did not work. Now it is properly prevented. + + * Fix the GET's response code when there is a missing segment in a + large object manifest. + + * Change black/white listing in ratelimit middleware to use sysmeta. + Instead of using the config option, operators can set + "X-Account-Sysmeta-Global-Write-Ratelimit: WHITELIST" or + "X-Account-Sysmeta-Global-Write-Ratelimit: BLACKLIST" on an account to + whitelist or blacklist it for ratelimiting. Note: the existing + config options continue to work. 
+ + * Use TCP_NODELAY on outgoing connections. + + * Improve object-replicator startup time. + + * Implement OPTIONS verb for storage nodes. + + * Various other minor bug fixes and improvements. + + +swift (2.2.1) + + * Swift now rejects object names with Unicode surrogates. + + * Return 403 (instead of 413) on unauthorized upload when over account + quota. + + * Fix a rare condition when a rebalance could cause swift-ring-builder + to crash. This would only happen on old ring files when "rebalance" + was the first command run. + + * Storage node error limits now survive a ring reload. + + * Speed up reading and writing xattrs for object metadata by using larger + xattr value sizes. The change is moving from 254 byte values to 64KiB + values. There is no migration issue with this. + + * Deleted containers beyond the reclaim age are now properly reclaimed. + + * Full Simplified Chinese translation (zh_CN locale) for errors and logs. + + * Container quota is now properly enforced during cross-account COPY. + + * ssync replication now properly uses the configured replication_ip. + + * Fixed issue where ssync did not replicate custom object headers. + + * swift-drive-audit now has the 'unmount_failed_device' config option + (default to True) that controls if the process will unmount failed + drives or not. + + * swift-drive-audit will now dump drive error rates to a recon file. + The file location is controlled by the 'recon_cache_path' config value + and it includes each drive and its associated number of errors. + + * When a filesystem doesn't support xattr, the object server now returns + a 507 Insufficient Storage error to the proxy server. + + * Clean up empty account and container partitions directories if they + are empty. This keeps the system healthy and prevents a large number + of empty directories from slowing down the replication process. + + * Show the sum of every policy's amount of async pendings in swift-recon. + + * Various other minor bug fixes and improvements. + + +swift (2.2.0, OpenStack Juno) + + * Added support for Keystone v3 auth. + + Keystone v3 introduced the concept of "domains" and user names + are no longer unique across domains. Swift's Keystone integration + now requires that ACLs be set on IDs, which are unique across + domains, and further restricts setting new ACLs to only use IDs. + + Please see https://docs.openstack.org/swift/latest/overview_auth.html for + more information on configuring Swift and Keystone together. + + * Swift now supports server-side account-to-account copy. Server- + side copy in Swift requires the X-Copy-From header (on a PUT) + or the Destination header (on a COPY). To initiate an account-to- + account copy, the existing header value remains the same, but the + X-Copy-From-Account header (on a PUT) or the Destination-Account + (on a COPY) are used to indicate the proper account. + + * Limit partition movement when adding a new placement tier. + + When adding a new placement tier (server, zone, or region), Swift + previously attempted to move all placement partitions, regardless + of the space available on the new tier, to ensure the best possible + durability. Unfortunately, this could result in too many partitions + being moved all at once to a new tier. Swift's ring-builder now + ensures that only the correct number of placement partitions are + rebalanced, and thus makes adding capacity to the cluster more + efficient. + + * Per storage policy container counts are now reported in + account response headers.
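+
+    For example (the policy name and count below are hypothetical), an
+    account HEAD response for a cluster with a policy named "gold" might
+    now include a header such as:
+
+        X-Account-Storage-Policy-Gold-Container-Count: 3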
+ + * Swift will now reject, with a 4xx series response, GET requests + with more than 50 ranges, more than 3 overlapping ranges, or more + than 8 non-increasing ranges. + + * The bind_port config setting is now required to be explicitly set. + + * The object server can now use splice() for a zero-copy GET + response. This feature is enabled with the "splice" config variable + in the object server config and defaults to off. Also, this feature + only works on recent Linux kernels (AF_ALG sockets must be + supported). A zero-copy GET response can significantly reduce CPU + requirements for object servers. + + * Added "--no-overlap" option to swift-dispersion populate so that + multiple runs of the tool can add coverage without overlapping + existing monitored partitions. + + * swift-recon now supports filtering by region. + + * Various other minor bug fixes and improvements. + + +swift (2.1.0) + + * swift-ring-builder placement was improved to allow gradual addition + of new regions without causing a massive migration of data to the new + region. The change was to prefer device weight first, then look at + failure domains. + + * Logging updates + + - Eliminated "Handoff requested (N)" log spam. + + - Added process pid to the end of storage node log lines. + + - Container auditor now logs a warning if the devices path contains a + non-directory. + + - Object daemons now send a user-agent string with their full name. + + * 412 and 416 responses are no longer tracked as errors in the StatsD + messages from the backend servers. + + * Parallel object auditor + + The object auditor can now be controlled with a "concurrency" config + value that allows multiple auditor processes to run at once. Using + multiple parallel auditor processes can speed up the overall auditor + cycle time. + + * The object updater will now concurrently update each necessary node + in a new greenthread. + + * TempURL updates + + - The default allowed methods have changed to also allow POST and + DELETE. The new default list is "GET HEAD PUT POST DELETE". + + - TempURLs for POST now also allow HEAD, matching existing GET and PUT + functionality. + + - Added filename*= support to TempURL Content-Disposition response + header. + + * X-Delete-At/After can now be used with the FormPost middleware. + + * Make swift-form-signature output a sample form. + + * Add v2 API to list endpoints middleware + + The new API adds better support for storage policies and changes the + response from a list of backend urls to a dictionary with the keys + "endpoints" and "headers". The endpoints key contains a list of the + backend urls, and the headers key is a dictionary of headers to send + along with the backend request. + + * Added allow_account_management and account_autocreate values to /info + responses. + + * Enable object system metadata on PUTs (Note: POST support is ongoing). + + * Various other minor bug fixes and improvements. + + +swift (2.0.0) + + * Storage policies + + Storage policies allow deployers to configure multiple object rings + and expose them to end users on a per-container basis. Deployers + can create policies based on hardware performance, regions, or other + criteria and independently choose different replication factors on + them. A policy is set on a Swift container at container creation + time and cannot be changed. 
+ + Full docs are at https://docs.openstack.org/swift/latest/overview_policies.html + + * Add profiling middleware in Swift + + The profile middleware provides a tool to profile Swift + code on the fly and collects statistical data for performance + analysis. A native simple Web UI is also provided to help + query and visualize the data. + + * Add --quoted option to swift-temp-url + + * swift-recon now supports checking the md5sum of swift.conf, which + helps deployers verify configurations are consistent across a cluster. + + * Users can now set the transaction id suffix by passing in + a value in the X-Trans-Id-Extra header. + + * New log_max_line_length option caps the maximum length of a log line. + + * Support If-[Un]Modified-Since for object HEAD + + * Added missing constraints and ratelimit parameters to /info + + * Add ability to remove subsections from /info + + * Unify logging for account, container, and object server processes + to provide a consistent message format. This change reorders the + fields logged for the account server. + + * Add targeted config loading to swift-init. This allows an easier + and more explicit way to tell swift-init to run specific server + process configurations. + + * Properly quote www-authenticate (CVE-2014-3497) + + * Fix logging issue when services stop on py26. + + * Change the default logged length of the auth token to 16. + + * Explicitly set permissions on generated ring files to 0644 + + * Fix file uploads larger than 2GiB in the formpost feature + + * Fixed issue where large objects would fail to download if the + auth token expired partway through the download + + * Various other minor bug fixes and improvements + + +swift (1.13.1, OpenStack Icehouse) + + * Change the behavior of CORS responses to better match the spec + + A new proxy config variable (strict_cors_mode, default to True) + has been added. Setting it to False keeps the old behavior. For + an overview of old versus new behavior, please see + https://review.opendev.org/#/c/69419/ + + * Invert the responsibility of the two instances of proxy-logging in + the proxy pipeline + + The first proxy_logging middleware instance to receive a request + in the pipeline marks that request as handling it. So now, the + left most proxy_logging middleware handles logging for all + client requests, and the right most proxy_logging middleware + handles all other requests initiated from within the pipeline to + its left. This fixes logging related to large object + requests not properly recording bandwidth. + + * Added swift-container-info and swift-account-info tools + + * Allow specification of object devices for audit + + * Dynamic large object COPY requests with ?multipart-manifest=get + now work as expected + + * When a client is downloading a large object and one of the segment + reads gets bad data, Swift will now immediately abort the request. + + * Fix ring-builder crash when a ring partition was assigned to a + deleted device, zero-weighted device, and normal device + + * Make probetests work with conf.d configs + + * Various other minor bug fixes and improvements. + + +swift (1.13.0) + + * Account-level ACLs and ACL format v2 + + Accounts now have a new privileged header to represent ACLs or + any other form of account-level access control. The value of + the header is a JSON dictionary string to be interpreted by the + auth system. A reference implementation is given in TempAuth. 
+ Please see the full docs at + https://docs.openstack.org/swift/latest/overview_auth.html + + * Added a WSGI environment flag to stop swob from always using + absolute location. This is useful if middleware needs to use + out-of-spec Location headers in a response. + + * Container sync proxies now support simple load balancing + + * Config option to lower the timeout for recoverable object GETs + + * Add a way to ratelimit all writes to an account + + * Allow multiple storage_domain values in cname_lookup middleware + + * Moved all DLO functionality into middleware + + The proxy will automatically insert the dlo middleware at an + appropriate place in the pipeline the same way it does with the + gatekeeper middleware. Clusters will still support DLOs after upgrade + even with an old config file that doesn't mention dlo at all. + + * Remove python-swiftclient dependency + + * Add secondary groups to process user during privilege escalation + + * When logging request headers, it is now possible to specify + specifically which headers should be logged + + * Added log_requests config parameter to account and container servers + to match the parameter in the object server. This allows a deployer + to turn off log messages for these processes. + + * Ensure swift.source is set for DLO/SLO requests + + * Fixed an issue where overwriting segments in a dynamic manifest + could cause issues on pipelined requests. + + * Properly handle COPY verb in container quota middleware + + * Improved StaticWeb 404 error message on web-listings and index + + * Various other minor bug fixes and improvements. + + +swift (1.12.0) + + * Several important pieces of information have been added to /info: + + - Configured constraints are included and allow a client to discover + the limits on names and object sizes that the cluster supports. + + - The supported tempurl methods are now included. + + - Static large object constraints are now included. + + * The Last-Modified header value returned will now be the object's + timestamp rounded up to the next second. This allows subsequent + requests with If-[un]modified-Since to use the Last-Modified + value as expected. + + * Non-integer values for if-delete-at headers will now properly + report a 400 error instead of a 503. + + * Fix object versioning with non-ASCII container names. + + * Bulk delete with POST now works properly. + + * Generic means for persisting system metadata + + Swift now supports system-level metadata on accounts and + containers. System metadata provides a means to store internal + custom metadata with associated Swift resources in a safe and + secure fashion without actually having to plumb custom metadata + through the core swift servers. The new gatekeeper middleware + prevents this system metadata from leaking into the request or + being set by a client. + + * catch_errors and gatekeeper middleware are now forced into the proxy + pipeline if not explicitly referenced. + + * New container sync configuration option, separating the end user + from knowing the required end point and adding more secure + signed requests. See + https://docs.openstack.org/swift/latest/overview_container_sync.html + for full information. + + * bulk middleware now can be configured to retry deleting containers. + + * The default yield_frequency used to keep client connections alive + during slow bulk requests was reduced from 60 seconds to 10 seconds. + While this is a change to a default, it should not affect deployments + and there is no migration process needed. 
+ + * Swift processes will attempt to set RLIMIT_NPROC to 8192. + + * Server processes will now exit with a non-zero error code on config + errors. + + * Warn if read_affinity is configured but not enabled. + + * Fix checkmount error parsing in swift-recon. + + * Log at warn level when an object is quarantined. + + * Fixed CVE-2014-0006 to avoid a potential timing attack with tempurl. + + * Various other minor bug fixes and improvements. + + +swift (1.11.0) + + * Added discoverable capabilities + + A Swift proxy server now by default (although it can be turned off) + will respond to requests to /info. The response to these requests + include information about the cluster and can be used by clients to + determine which features are supported in the cluster. + + * Object replication ssync (an rsync alternative) + + A Swift storage node can now be configured to use Swift primitives + for replication transport instead of rsync. This is an experimental + feature that is not yet considered production ready. + + * If a source times out on an object server read, try another one + of them with a modified range. + + * The proxy now responds to many types of requests as soon as it + has a quorum. This can help speed up responses (without + changing the results), especially when one node is acting up. + There is a post_quorum_timeout config value that can tune how + long to wait for requests to finish after a quorum has been + established. + + * Add accurate timestamps in proxy log lines for the start and + end of a request. These are added as new fields on the end of + the existing log lines, and therefore should not break + existing, well-behaved log processors. + + * Add an "inline" query parameter to tempurl + + By default, temporary URLs add a "Content-Disposition" header + that forces many clients to download the object. Now, temporary + URLs support an optional "inline" query parameter that will + force a "Content-Disposition: inline" header to be added to the + response, overriding the default. + + * Use TCP_NODELAY for created sockets. This can dramatically + lower latency for small object workloads. + + * DiskFile API, with reference implementation + + The DiskFile abstraction for talking to data on disk has been + refactored to allow alternate implementations to be developed. + Included in the codebase is an in-memory reference + implementation. For full documentation, please see the developer + documentation. The DiskFile API is still a work in progress and + is not yet finalized. + + * Removal of swift-bench + + The included benchmarking tool swift-bench has been extracted + from the codebase and is now in its own repository at + https://github.com/openstack/swift-bench. New swift-bench + binaries and packages may be found on PyPI at + https://pypi.org/project/swift-bench + + * Bulk delete now also supports the POST verb, in addition to DELETE + + * Added functionality to the swift-ring-builder to support + limited recreation of ring builder files from the ring file itself. + + * HEAD on account now returns 410 if account was deleted and + not yet reaped. The old behavior was to return a 404. + + * Fixed a bug introduced since the 1.10.0 release that + prevented expired objects from being removed from the system. + This resulted in orphaned expired objects taking up space on + the system but inaccessible to the API. This regression and + fix are only important if you have deployed code since the + 1.10.0 release. 
For a full discussion, including a script that + can be used to clean up orphaned objects, see + https://bugs.launchpad.net/swift/+bug/1257330 + + * Tie socket write buffer size to server chunk size parameter. This + pairs the underlying network buffer size with the size of data + that Swift attempts to read from the connection, thereby + improving efficiency and throughput on connections. + + * Fix 500 from account-quota middleware. If a user had set + X-Account-Meta-Quota-Bytes to something non-integer prior to + the installation of the account-quota middleware, then the + quota check would choke on it. Now a non-integer value is + treated as "no quota". + + * Quarantine objects with busted metadata. Before, if you + encountered an object with corrupt or missing xattrs, the + object server would return a 500 on GET, and wouldn't quarantine + anything. Now the object server returns a 404 for that GET and + the corrupted file is quarantined, thus giving replication a + chance to fix it. + + * Fix quarantine and error counts in audit logs + + * Report transaction ID in failure exception logs + + * Make pbr a build-time only dependency + + * Worked around a bug in eventlet 0.9.16 where the size of the + memcache connection pools would grow unbounded. + + * Tempurl keys are now properly stored as utf8 + + * Fixed an issue where concurrent PUT requests to accounts or + containers may result in errors due to locked databases. + + * Handle copy requests in account and container quota middleware + + * Now ensure that a WWW-Authenticate header is on all 401 responses + + * Various other bug fixes and improvements + + +swift (1.10.0, OpenStack Havana) + + * Added support for pooling memcache connections + + * Added support to replicating handoff partitions first in object + replication. Can also configure how many remote nodes a storage node + must talk to before removing a local handoff partition. + + * Fixed bug where memcache entries would not expire + + * Much faster calculation for choosing handoff nodes + + * Added container listing ratelimiting + + * Fixed issue where the proxy would continue to read from a storage + server even after a client had disconnected + + * Added support for headers that are only visible to the owner of a Swift + account + + * Fixed ranged GET with If-None-Match + + * Fixed an issue where rings may not be balanced after initial creation + + * Fixed internationalization support + + * Return the correct etag for a static large object on the PUT response + + * Allow users to extract archives to containers with ACLs set + + * Fix support for range requests against static large objects + + * Now logs x-copy-from header in a useful place + + * Reverted back to old XML output of account and container listings to + ensure older clients do not break + + * Account quotas now appropriately handle copy requests + + * Fix issue with UTF-8 handling in versioned writes + + * Various other bug fixes and improvements, including support for running + Swift under Pypy and continuing work to support storage policies + + +swift (1.9.1) + + * Disallow PUT, POST, and DELETE requests from creating older tombstone + files, preventing the possibility of filling up the disk and removing + unnecessary container updates. + + * Set default wsgi workers to cpu_count + + Change the default value of wsgi workers from 1 to auto. The new + default value for workers in the proxy, container, account & object + wsgi servers will spawn as many workers per process as you have cpu + cores. 
This will not be ideal for some configurations, but it's much + more likely to produce a successful out of the box deployment. + + * Added reveal_sensitive_prefix config setting to filter the auth token + logged by the proxy server. + + * Ensure Keystone's reseller prefix ends with an underscore. Previously + this was a recommendation--now it is enforced. + + * Added log_file_pattern config to swift-drive-audit for drive errors + + * Add support for telling Swift to detect a content type on a request. + + * Additional object stats are now logged in the object auditor + + * Moved the DiskFile interface into its own module + + * Ensure the SQLite cursors are closed when creating functions + + * Better support for valid Accept headers + + * In Keystone, don't allow users to delete their own account + + * Return a UTC timezone designator in container listings + + * Ensure that users can't remove their account quotas + + * Allow floating point value for dispersion coverage + + * Fix incorrect error page handling in staticweb + + * Add utf-8 charset to multipart-manifest=get response. + + * Allow dispersion tools to use keystone server with insecure certificate + + * Ensure that files are always closed in tests + + * Use OpenStack's "Hacking" guidelines for code formatting + + * Various other minor bug fixes and improvements + + +swift (1.9.0) + + * Global clusters support + + The "region" concept introduced in Swift 1.8.0 has been augmented with + support for using a separate replication network and configuring read + and write affinity. These features combine to offer support for a single + Swift cluster spanning a wide geographic area. + + * Disk performance + + The object server now can be configured to use threadpools to increase + performance and smooth out latency throughout the system. Also, many + disk operations were reordered to increase reliability and improve + performance. + + * Added config file conf.d support + + Allow Swift daemons and servers to optionally accept a directory as the + configuration parameter. This allows different parts of the config file + to be managed separately, eg each middleware could use a separate file + for its particular config settings. + + * Allow two TempURL keys per account + + By adding a second key, a user can safely rotate keys and prevent URLs + already in use from becoming invalid. TempURL middleware has also been + updated to allow a configurable set of allowed methods and to prevent a + bug related to content-disposition names. + + * Added crossdomain.xml middleware. See + https://docs.openstack.org/swift/latest/crossdomain.html for details + + * Added rsync bandwidth limit setting for object replicator + + * Transaction ID updated to include the time and an optional suffix + + * Added x-remove-versions-location header to disable versioned writes + + * Improvements to support for Keystone ACLs + + * Added parallelism to object expirer daemon + + * Added support for ring hash prefix in addition to the existing suffix + + * Allow all headers requested for CORS + + * Stop getting useless bytes on manifest Range requests + + * Improved container-sync resiliency + + * Added example Apache config files.
See + https://docs.openstack.org/swift/latest/apache_deployment_guide.html + for more info + + * If an account is marked as deleted but hasn't been reaped and is still + on disk, responses will include an "X-Account-Status" header + + * Fix 503 on account/container HEAD with invalid format + + * Added extra safety on account-level DELETE when using bulk deletes + + * Made colons quote-safe in logs (mainly for IPv6) + + * Fixed bug with bulk delete max items + + * Fixed static large object manifest range requests + + * Prevent static large objects from containing other static large objects + + * Fixed issue with use of delimiter in container queries where some + objects would not be listed + + * Various other minor bug fixes and improvements + + +swift (1.8.0, OpenStack Grizzly) + + * Make rings' replica count adjustable + + * Added a region tier to the ring above zones + + * Added timing-based sorting of object servers on read requests + + * Added support for auto-extract archive uploads + + * Added support for bulk delete requests + + * Added support for large objects with static manifests + + * Added list_endpoints middleware to provide an API for determining where + the ring places data + + * proxy-logging middleware can now handle logging for other middleware + + proxy-logging should be used twice in the proxy pipeline. The first + handles middleware logs for requests that never made it all the way + to the server. The last handles requests that do make it to the server. + + This is a change that may require an update to your proxy server + config file or custom middleware that you may be using. See the full + docs at https://docs.openstack.org/swift/latest/misc.html. + + * Changed the default sample rate for a few high-traffic requests. + + Added log_statsd_sample_rate_factor to globally tune the StatsD + sample rate. This tunable can be used to reduce StatsD traffic + proportionally for all metrics and is intended to replace + log_statsd_default_sample_rate, which is left alone for + backward-compatibility, should anyone be using it. 
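+
+    As a minimal illustration of the proxy-logging change above (the exact
+    pipeline shown is hypothetical; real deployments place additional
+    middleware between the two instances), a proxy pipeline with two
+    proxy-logging entries might look like:
+
+        pipeline = catch_errors proxy-logging cache tempauth proxy-logging proxy-server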
+ + * Added swift_hash_path_prefix option to swift.conf + + New deployments are advised to set this value to a random secret + to protect against hash collisions + + * Added user-managed container quotas + + * Added support for account-level quotas managed by an auth reseller + + * Added --run-dir option to swift-init + + * Added more options to swift-bench + + * Added support for CORS "actual requests" + + * Added fallocate_reserve option to protect against full drives + + * Allow ring rebalance to take a seed + + * Ring serialization will now produce the same gzip file (Py2.7) + + * Added support to swift-drive-audit for handling rotated logs + + * Added first-byte latency timings for GET requests + + * Added per disk PUT timing monitoring support + + * Added speed limit options for DB auditor + + * Force log entries to be one line + + * Ensure that fsync is used and not just fdatasync + + * Improved handoff node selection + + * Deprecated keystone is_admin feature + + * Fix large objects with unicode in the segment names + + * Update Swift's MemcacheRing to provide API compatibility with + standard Python memcache libraries + + * Various other minor bug fixes and improvements + + +swift (1.7.6) + + * Better tempauth storage URL guessing + + * Added --top option to swift-recon -d + + * Allow optional, temporary healthcheck failure + + * keystoneauth middleware now supports cross-tenant ACLs + + * Add dispersion report flags to limit reports + + * Add config option to turn eventlet debug on/off + + * Added override option for swift-init's KILL_WAIT + + * Added oldest and most recent replication pass to swift-recon + + * Fixed 500 error response when GETing a many-segment manifest + + * Memcached keys now use a delta timeout when possible + + * Refactor DiskFile to hide temp file names and exts + + * Remove IP-based container-sync ACLs from auth middlewares + + * Fixed bug in deleting memcached account info data + + * Fixed lazy-listing of object manifest segments + + * Fixed bug where a ? in the object name caused an error + + * Swift now returns 406 if it can't satisfy Accept + + * Fix infinite recursion bug in object replicator + + * Swift will now reject names with NULL characters + + * Fixed object-auditor logging to use a minimum of unix sockets + + * Various other minor bug fixes and improvements + + swift (1.7.5) * Support OPTIONS verb, including CORS preflight requests @@ -48,29 +4600,32 @@ swift (1.7.5) * Various other minor bug fixes and improvements -swift (1.7.4) + +swift (1.7.4, OpenStack Folsom) * Fix issue where early client disconnects may have caused a memory leak + swift (1.7.2) * Fix issue where memcache serialization was not properly loading the config value + swift (1.7.0) * Use custom encoding for ring data instead of pickle Serialize RingData in a versioned, custom format which is a combination of a JSON-encoded header and .tostring() dumps of the - replica2part2dev_id arrays. This format deserializes hundreds of times + replica2part2dev_id arrays. This format deserializes hundreds of times faster than rings serialized with Python 2.7's pickle (a significant performance regression for ring loading between Python 2.6 and Python - 2.7). Fixes bug 1031954. + 2.7). Fixes bug 1031954. The new implementation is backward-compatible; if a ring does not begin with a new-style magic string, it is assumed to be an - old-style pickle-dumped ring and is handled as before. So new Swift + old-style pickle-dumped ring and is handled as before. 
So new Swift code can read old rings, but old Swift code will not be able to read newly-serialized rings. @@ -127,6 +4682,7 @@ swift (1.7.0) * Various other minor bug fixes and improvements + swift (1.6.0) * Removed bin/swift and swift/common/client.py from the swift repo. These @@ -141,7 +4697,7 @@ swift (1.6.0) substantially affects the JSON output of the dispersion report, and any tools written to consume this output will need to be updated. - * Added Solaris (Illumos) compability + * Added Solaris (Illumos) compatibility * Added -a option to swift-get-nodes to show all handoffs @@ -186,6 +4742,7 @@ swift (1.6.0) * Various other minor bug fixes and improvements + swift (1.5.0) * New option to toggle SQLite database preallocation with account @@ -254,7 +4811,8 @@ swift (1.5.0) * Various other minor bug fixes and improvements -swift (1.4.8) + +swift (1.4.8, OpenStack Essex) * Added optional max_containers_per_account restriction @@ -285,6 +4843,7 @@ swift (1.4.8) * Refactored some ring building functions for clarity and simplicity + swift (1.4.7) * Improvements to account and container replication. @@ -303,6 +4862,7 @@ swift (1.4.7) * Other bug fixes and documentation updates. + swift (1.4.6) * TempURL and FormPost middleware added @@ -327,6 +4887,7 @@ swift (1.4.6) * Other minor bug fixes + swift (1.4.5) * New swift-orphans and swift-oldies command line tools to detect @@ -355,6 +4916,7 @@ swift (1.4.5) * PEP8 Updates. + swift (1.4.4) * Fixes to prevent socket hoarding (memory leak) @@ -397,7 +4959,8 @@ swift (1.4.4) * Query only specific zone via swift-recon. -swift (1.4.3) + +swift (1.4.3, OpenStack Diablo) * Additional quarantine catching code. @@ -421,6 +4984,7 @@ swift (1.4.3) * Fix to the swift tool to strip any leading slashes on file names when uploading. + swift (1.4.2) * Removed stats/logging code from Swift [now in separate slogging project]. @@ -448,6 +5012,7 @@ swift (1.4.2) * This fixes the bug that drop_buffer_cache() doesn't work on systems where off_t isn't 64 bits. + swift (1.4.1) * st renamed to swift @@ -464,6 +5029,7 @@ swift (1.4.1) * Accounts are auto-created if an auth token is valid when the account_autocreate proxy config parameter is set to true. + swift (1.4.0) * swift-bench now cleans up containers it creates. @@ -522,3 +5088,16 @@ swift (1.4.0) * Stats uploaders now allow overrides for source_filename_pattern and new_log_cutoff values. + + +---- + +Changelog entries for previous versions are incomplete + +swift (1.3.0, OpenStack Cactus) + +swift (1.2.0, OpenStack Bexar) + +swift (1.1.0, OpenStack Austin) + +swift (1.0.0, Initial Release) diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md deleted file mode 100644 index 85297900c3..0000000000 --- a/CONTRIBUTING.md +++ /dev/null @@ -1,12 +0,0 @@ -If you would like to contribute to the development of OpenStack, -you must follow the steps in the "If you're a developer, start here" -section of this page: [http://wiki.openstack.org/HowToContribute](http://wiki.openstack.org/HowToContribute#If_you.27re_a_developer.2C_start_here:) - -Once those steps have been completed, changes to OpenStack -should be submitted for review via the Gerrit tool, following -the workflow documented at [http://wiki.openstack.org/GerritWorkflow](http://wiki.openstack.org/GerritWorkflow). - -Pull requests submitted through GitHub will be ignored. - -Bugs should be filed [on Launchpad](https://bugs.launchpad.net/swift), -not in GitHub's issue tracker. 
diff --git a/CONTRIBUTING.rst b/CONTRIBUTING.rst new file mode 100644 index 0000000000..b2117bf7f5 --- /dev/null +++ b/CONTRIBUTING.rst @@ -0,0 +1,184 @@ +Contributing to OpenStack Swift +=============================== + +Who is a Contributor? +--------------------- + +Put simply, if you improve Swift, you're a contributor. The easiest way to +improve the project is to tell us where there's a bug. In other words, filing +a bug is a valuable and helpful way to contribute to the project. + +Once a bug has been filed, someone will work on writing a patch to fix the +bug. Perhaps you'd like to fix a bug. Writing code to fix a bug or add new +functionality is tremendously important. + +Once code has been written, it is submitted upstream for review. All code, +even that written by the most senior members of the community, must pass code +review and all tests before it can be included in the project. Reviewing +proposed patches is a very helpful way to be a contributor. + +Swift is nothing without the community behind it. We'd love to welcome you to +our community. Come find us in #openstack-swift on OFTC IRC or on the +OpenStack dev mailing list. + +For general information on contributing to OpenStack, please check out the +`contributor guide `_ to get started. +It covers all the basics that are common to all OpenStack projects: the accounts +you need, the basics of interacting with our Gerrit review system, how we +communicate as a community, etc. + +For more project information, feel free to check out the `Swift documentation `__. + +Filing a Bug +~~~~~~~~~~~~ + +Filing a bug is the easiest way to contribute. You can find currently-tracked bugs on our `Launchpad. `__ +Use the `Report a bug `__ link to +file a new bug. + +If you find something in Swift that doesn't match the documentation or doesn't +meet your expectations with how it should work, please let us know. Of course, +if you ever get an error (like a Traceback message in the logs), we definitely +want to know about that. We'll do our best to diagnose any problem and patch +it as soon as possible. + +A bug report, at minimum, should describe what you were doing that caused the +bug. "Swift broke, pls fix" is not helpful. Instead, something like "When I +restarted syslog, Swift started logging traceback messages" is very helpful. +The goal is that we can reproduce the bug and isolate the issue in order to +apply a fix. If you don't have full details, that's ok. Anything you can +provide is helpful. + +You may have noticed that there are many tracked bugs, but not all of them +have been confirmed. If you take a look at an old bug report and you can +reproduce the issue described, please leave a comment on the bug about that. +It lets us all know that the bug is very likely to be valid. + +Reviewing Someone Else's Code +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +All code reviews in OpenStack projects are done on our Gerrit instance at +`review.opendev.org `__. +Reviewing patches is one of the most effective ways you can contribute to the community. + +We've written a set of `Review Guidelines `__ to help you +give good reviews. + +To find out which reviews are a priority in the community, you can read `Priority Reviews `__ on our wiki. + +What do I work on? +------------------ + +If you're looking for a way to write and contribute code, but you're not sure +what to work on, check out the `"wishlist" bugs `__ in the bug tracker. These are +normally smaller items that someone took the time to write down but didn't +have time to implement.
+ +And please join #openstack-swift on OFTC IRC to tell us what you're working on. + +Getting Started +--------------- + +https://docs.openstack.org/swift/latest/first_contribution_swift.html + +Once those steps have been completed, changes to OpenStack +should be submitted for review via the Gerrit tool, following our `Development Workflow. `__ + +Gerrit is the review system used in the OpenStack projects. We're sorry, but +we won't be able to respond to pull requests submitted through GitHub. + +Bugs should be filed `on Launchpad `__, +not in GitHub's issue tracker. + +Swift Design Principles +======================= + +- `The Zen of Python `__ +- Simple Scales +- Minimal dependencies +- Re-use existing tools and libraries when reasonable +- Leverage the economies of scale +- Small, loosely coupled RESTful services +- No single points of failure +- Start with the use case +- ... then design from the cluster operator up +- If you haven't argued about it, you don't have the right answer yet + :) +- If it is your first implementation, you probably aren't done yet :) + +Please don't feel offended by difference of opinion. Be prepared to +advocate for your change and iterate on it based on feedback. Reach out +to other people working on the project on +`IRC `__ or +the `mailing +list `__ - we want +to help. + +Recommended workflow +==================== + +- Set up a `Swift All-In-One + VM `__\ (SAIO). + +- Make your changes. Docs and tests for your patch must land before or + with your patch. + +- Run unit tests, functional tests, probe tests ``./.unittests`` + ``./.functests`` ``./.probetests`` + +- Run ``tox`` (no command-line args needed) + +- ``git review`` + +Notes on Testing +================ + +Running the tests above against Swift in your development environment +(ie your SAIO) will catch most issues. Any patch you propose is expected +to be both tested and documented and all tests should pass. + +If you want to run just a subset of the tests while you are developing, +you can use pytest: + +.. code-block:: console + + cd test/unit/common/middleware/ && pytest test_healthcheck.py + +To check which parts of your code are being exercised by a test, you can +run tox and then point your browser to swift/cover/index.html: + +.. code-block:: console + + tox -e py3 -- test.unit.common.middleware.test_healthcheck:TestHealthCheck.test_healthcheck + +Swift's unit tests are designed to test small parts of the code in +isolation. The functional tests validate that the entire system is +working from an external perspective (they are "black-box" tests). You +can even run functional tests against public Swift endpoints. The +probetests are designed to test much of Swift's internal processes. For +example, a test may write data, intentionally corrupt it, and then +ensure that the correct processes detect and repair it. + +When your patch is submitted for code review, it will automatically be +tested on the OpenStack CI infrastructure. In addition to many of the +tests above, it will also be tested by several other OpenStack test +jobs. + +Once your patch has been reviewed and approved by core reviewers and +has passed all automated tests, it will be merged into the Swift source +tree. + +Ideas +===== + +https://wiki.openstack.org/wiki/Swift/ideas + +If you're working on something, it's a very good idea to write down +what you're thinking about. This lets others get up to speed, helps +you collaborate, and serves as a great record for future reference. 
+Write down your thoughts somewhere and put a link to it here. It +doesn't matter what form your thoughts are in; use whatever is best +for you. Your document should include why your idea is needed and your +thoughts on particular design choices and tradeoffs. Please include +some contact information (ideally, your IRC nick) so that people can +collaborate with you. diff --git a/Dockerfile b/Dockerfile new file mode 100644 index 0000000000..f4a652ba40 --- /dev/null +++ b/Dockerfile @@ -0,0 +1,76 @@ +################################################ +# +# Alpine 3.16.2 Swift-All-In-One +# +################################################ + +FROM alpine:3.16.2 +MAINTAINER Openstack Swift + +ENV S6_LOGGING 1 +ENV S6_VERSION 1.21.4.0 +ENV SOCKLOG_VERSION 3.0.1-1 +ENV ARCH amd64 +ENV BUILD_DIR "/tmp" +ENV ENV="/etc/profile" + +#COPY docker/install_scripts /install_scripts +COPY . /opt/swift + +ADD https://github.com/just-containers/s6-overlay/releases/download/v$S6_VERSION/s6-overlay-$ARCH.tar.gz /tmp/ +ADD https://github.com/just-containers/s6-overlay/releases/download/v$S6_VERSION/s6-overlay-$ARCH.tar.gz.sig /tmp/ +ADD https://github.com/just-containers/socklog-overlay/releases/download/v$SOCKLOG_VERSION/socklog-overlay-$ARCH.tar.gz /tmp/ + +RUN mkdir /etc/swift && \ + echo && \ + echo && \ + echo && \ + echo "================ starting swift_needs ===================" && \ + /opt/swift/docker/install_scripts/00_swift_needs.sh && \ + echo && \ + echo && \ + echo && \ + echo "================ starting apk_install_prereqs ===================" && \ + /opt/swift/docker/install_scripts/10_apk_install_prereqs.sh && \ + echo && \ + echo && \ + echo && \ + echo "================ starting apk_install_py3 ===================" && \ + /opt/swift/docker/install_scripts/21_apk_install_py3.sh && \ + echo && \ + echo && \ + echo && \ + echo "================ starting swift_install ===================" && \ + /opt/swift/docker/install_scripts/50_swift_install.sh && \ + echo && \ + echo && \ + echo && \ + echo "================ installing s6-overlay ===================" && \ + gpg --import /opt/swift/docker/s6-gpg-pub-key && \ + gpg --verify /tmp/s6-overlay-$ARCH.tar.gz.sig /tmp/s6-overlay-$ARCH.tar.gz && \ + gunzip -c /tmp/s6-overlay-$ARCH.tar.gz | tar -xf - -C / && \ + gunzip -c /tmp/socklog-overlay-amd64.tar.gz | tar -xf - -C / && \ + rm -rf /tmp/s6-overlay* && \ + rm -rf /tmp/socklog-overlay* && \ + echo && \ + echo && \ + echo && \ + echo "================ starting pip_uninstall_dev ===================" && \ + /opt/swift/docker/install_scripts/60_pip_uninstall_dev.sh && \ + echo && \ + echo && \ + echo && \ + echo "================ starting apk_uninstall_dev ===================" && \ + /opt/swift/docker/install_scripts/99_apk_uninstall_dev.sh && \ + echo && \ + echo && \ + echo && \ + echo "================ clean up ===================" && \ + echo "TODO: cleanup" + #rm -rf /opt/swift + + +# Add Swift required configuration files +COPY docker/rootfs / + +ENTRYPOINT ["/init"] diff --git a/LICENSE b/LICENSE index 75b52484ea..d645695673 100644 --- a/LICENSE +++ b/LICENSE @@ -1,202 +1,202 @@ - - Apache License - Version 2.0, January 2004 - http://www.apache.org/licenses/ - - TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION - - 1. Definitions. - - "License" shall mean the terms and conditions for use, reproduction, - and distribution as defined by Sections 1 through 9 of this document. 
- - "Licensor" shall mean the copyright owner or entity authorized by - the copyright owner that is granting the License. - - "Legal Entity" shall mean the union of the acting entity and all - other entities that control, are controlled by, or are under common - control with that entity. For the purposes of this definition, - "control" means (i) the power, direct or indirect, to cause the - direction or management of such entity, whether by contract or - otherwise, or (ii) ownership of fifty percent (50%) or more of the - outstanding shares, or (iii) beneficial ownership of such entity. - - "You" (or "Your") shall mean an individual or Legal Entity - exercising permissions granted by this License. - - "Source" form shall mean the preferred form for making modifications, - including but not limited to software source code, documentation - source, and configuration files. - - "Object" form shall mean any form resulting from mechanical - transformation or translation of a Source form, including but - not limited to compiled object code, generated documentation, - and conversions to other media types. - - "Work" shall mean the work of authorship, whether in Source or - Object form, made available under the License, as indicated by a - copyright notice that is included in or attached to the work - (an example is provided in the Appendix below). - - "Derivative Works" shall mean any work, whether in Source or Object - form, that is based on (or derived from) the Work and for which the - editorial revisions, annotations, elaborations, or other modifications - represent, as a whole, an original work of authorship. For the purposes - of this License, Derivative Works shall not include works that remain - separable from, or merely link (or bind by name) to the interfaces of, - the Work and Derivative Works thereof. - - "Contribution" shall mean any work of authorship, including - the original version of the Work and any modifications or additions - to that Work or Derivative Works thereof, that is intentionally - submitted to Licensor for inclusion in the Work by the copyright owner - or by an individual or Legal Entity authorized to submit on behalf of - the copyright owner. For the purposes of this definition, "submitted" - means any form of electronic, verbal, or written communication sent - to the Licensor or its representatives, including but not limited to - communication on electronic mailing lists, source code control systems, - and issue tracking systems that are managed by, or on behalf of, the - Licensor for the purpose of discussing and improving the Work, but - excluding communication that is conspicuously marked or otherwise - designated in writing by the copyright owner as "Not a Contribution." - - "Contributor" shall mean Licensor and any individual or Legal Entity - on behalf of whom a Contribution has been received by Licensor and - subsequently incorporated within the Work. - - 2. Grant of Copyright License. Subject to the terms and conditions of - this License, each Contributor hereby grants to You a perpetual, - worldwide, non-exclusive, no-charge, royalty-free, irrevocable - copyright license to reproduce, prepare Derivative Works of, - publicly display, publicly perform, sublicense, and distribute the - Work and such Derivative Works in Source or Object form. - - 3. Grant of Patent License. 
Subject to the terms and conditions of - this License, each Contributor hereby grants to You a perpetual, - worldwide, non-exclusive, no-charge, royalty-free, irrevocable - (except as stated in this section) patent license to make, have made, - use, offer to sell, sell, import, and otherwise transfer the Work, - where such license applies only to those patent claims licensable - by such Contributor that are necessarily infringed by their - Contribution(s) alone or by combination of their Contribution(s) - with the Work to which such Contribution(s) was submitted. If You - institute patent litigation against any entity (including a - cross-claim or counterclaim in a lawsuit) alleging that the Work - or a Contribution incorporated within the Work constitutes direct - or contributory patent infringement, then any patent licenses - granted to You under this License for that Work shall terminate - as of the date such litigation is filed. - - 4. Redistribution. You may reproduce and distribute copies of the - Work or Derivative Works thereof in any medium, with or without - modifications, and in Source or Object form, provided that You - meet the following conditions: - - (a) You must give any other recipients of the Work or - Derivative Works a copy of this License; and - - (b) You must cause any modified files to carry prominent notices - stating that You changed the files; and - - (c) You must retain, in the Source form of any Derivative Works - that You distribute, all copyright, patent, trademark, and - attribution notices from the Source form of the Work, - excluding those notices that do not pertain to any part of - the Derivative Works; and - - (d) If the Work includes a "NOTICE" text file as part of its - distribution, then any Derivative Works that You distribute must - include a readable copy of the attribution notices contained - within such NOTICE file, excluding those notices that do not - pertain to any part of the Derivative Works, in at least one - of the following places: within a NOTICE text file distributed - as part of the Derivative Works; within the Source form or - documentation, if provided along with the Derivative Works; or, - within a display generated by the Derivative Works, if and - wherever such third-party notices normally appear. The contents - of the NOTICE file are for informational purposes only and - do not modify the License. You may add Your own attribution - notices within Derivative Works that You distribute, alongside - or as an addendum to the NOTICE text from the Work, provided - that such additional attribution notices cannot be construed - as modifying the License. - - You may add Your own copyright statement to Your modifications and - may provide additional or different license terms and conditions - for use, reproduction, or distribution of Your modifications, or - for any such Derivative Works as a whole, provided Your use, - reproduction, and distribution of the Work otherwise complies with - the conditions stated in this License. - - 5. Submission of Contributions. Unless You explicitly state otherwise, - any Contribution intentionally submitted for inclusion in the Work - by You to the Licensor shall be under the terms and conditions of - this License, without any additional terms or conditions. - Notwithstanding the above, nothing herein shall supersede or modify - the terms of any separate license agreement you may have executed - with Licensor regarding such Contributions. - - 6. Trademarks. 
This License does not grant permission to use the trade - names, trademarks, service marks, or product names of the Licensor, - except as required for reasonable and customary use in describing the - origin of the Work and reproducing the content of the NOTICE file. - - 7. Disclaimer of Warranty. Unless required by applicable law or - agreed to in writing, Licensor provides the Work (and each - Contributor provides its Contributions) on an "AS IS" BASIS, - WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or - implied, including, without limitation, any warranties or conditions - of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A - PARTICULAR PURPOSE. You are solely responsible for determining the - appropriateness of using or redistributing the Work and assume any - risks associated with Your exercise of permissions under this License. - - 8. Limitation of Liability. In no event and under no legal theory, - whether in tort (including negligence), contract, or otherwise, - unless required by applicable law (such as deliberate and grossly - negligent acts) or agreed to in writing, shall any Contributor be - liable to You for damages, including any direct, indirect, special, - incidental, or consequential damages of any character arising as a - result of this License or out of the use or inability to use the - Work (including but not limited to damages for loss of goodwill, - work stoppage, computer failure or malfunction, or any and all - other commercial damages or losses), even if such Contributor - has been advised of the possibility of such damages. - - 9. Accepting Warranty or Additional Liability. While redistributing - the Work or Derivative Works thereof, You may choose to offer, - and charge a fee for, acceptance of support, warranty, indemnity, - or other liability obligations and/or rights consistent with this - License. However, in accepting such obligations, You may act only - on Your own behalf and on Your sole responsibility, not on behalf - of any other Contributor, and only if You agree to indemnify, - defend, and hold each Contributor harmless for any liability - incurred by, or claims asserted against, such Contributor by reason - of your accepting any such warranty or additional liability. - - END OF TERMS AND CONDITIONS - - APPENDIX: How to apply the Apache License to your work. - - To apply the Apache License to your work, attach the following - boilerplate notice, with the fields enclosed by brackets "[]" - replaced with your own identifying information. (Don't include - the brackets!) The text should be enclosed in the appropriate - comment syntax for the file format. We also recommend that a - file or class name and description of purpose be included on the - same "printed page" as the copyright notice for easier - identification within third-party archives. - - Copyright [yyyy] [name of copyright owner] - - Licensed under the Apache License, Version 2.0 (the "License"); - you may not use this file except in compliance with the License. - You may obtain a copy of the License at - - http://www.apache.org/licenses/LICENSE-2.0 - - Unless required by applicable law or agreed to in writing, software - distributed under the License is distributed on an "AS IS" BASIS, - WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - See the License for the specific language governing permissions and - limitations under the License. 
+ + Apache License + Version 2.0, January 2004 + http://www.apache.org/licenses/ + + TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION + + 1. Definitions. + + "License" shall mean the terms and conditions for use, reproduction, + and distribution as defined by Sections 1 through 9 of this document. + + "Licensor" shall mean the copyright owner or entity authorized by + the copyright owner that is granting the License. + + "Legal Entity" shall mean the union of the acting entity and all + other entities that control, are controlled by, or are under common + control with that entity. For the purposes of this definition, + "control" means (i) the power, direct or indirect, to cause the + direction or management of such entity, whether by contract or + otherwise, or (ii) ownership of fifty percent (50%) or more of the + outstanding shares, or (iii) beneficial ownership of such entity. + + "You" (or "Your") shall mean an individual or Legal Entity + exercising permissions granted by this License. + + "Source" form shall mean the preferred form for making modifications, + including but not limited to software source code, documentation + source, and configuration files. + + "Object" form shall mean any form resulting from mechanical + transformation or translation of a Source form, including but + not limited to compiled object code, generated documentation, + and conversions to other media types. + + "Work" shall mean the work of authorship, whether in Source or + Object form, made available under the License, as indicated by a + copyright notice that is included in or attached to the work + (an example is provided in the Appendix below). + + "Derivative Works" shall mean any work, whether in Source or Object + form, that is based on (or derived from) the Work and for which the + editorial revisions, annotations, elaborations, or other modifications + represent, as a whole, an original work of authorship. For the purposes + of this License, Derivative Works shall not include works that remain + separable from, or merely link (or bind by name) to the interfaces of, + the Work and Derivative Works thereof. + + "Contribution" shall mean any work of authorship, including + the original version of the Work and any modifications or additions + to that Work or Derivative Works thereof, that is intentionally + submitted to Licensor for inclusion in the Work by the copyright owner + or by an individual or Legal Entity authorized to submit on behalf of + the copyright owner. For the purposes of this definition, "submitted" + means any form of electronic, verbal, or written communication sent + to the Licensor or its representatives, including but not limited to + communication on electronic mailing lists, source code control systems, + and issue tracking systems that are managed by, or on behalf of, the + Licensor for the purpose of discussing and improving the Work, but + excluding communication that is conspicuously marked or otherwise + designated in writing by the copyright owner as "Not a Contribution." + + "Contributor" shall mean Licensor and any individual or Legal Entity + on behalf of whom a Contribution has been received by Licensor and + subsequently incorporated within the Work. + + 2. Grant of Copyright License. 
Subject to the terms and conditions of + this License, each Contributor hereby grants to You a perpetual, + worldwide, non-exclusive, no-charge, royalty-free, irrevocable + copyright license to reproduce, prepare Derivative Works of, + publicly display, publicly perform, sublicense, and distribute the + Work and such Derivative Works in Source or Object form. + + 3. Grant of Patent License. Subject to the terms and conditions of + this License, each Contributor hereby grants to You a perpetual, + worldwide, non-exclusive, no-charge, royalty-free, irrevocable + (except as stated in this section) patent license to make, have made, + use, offer to sell, sell, import, and otherwise transfer the Work, + where such license applies only to those patent claims licensable + by such Contributor that are necessarily infringed by their + Contribution(s) alone or by combination of their Contribution(s) + with the Work to which such Contribution(s) was submitted. If You + institute patent litigation against any entity (including a + cross-claim or counterclaim in a lawsuit) alleging that the Work + or a Contribution incorporated within the Work constitutes direct + or contributory patent infringement, then any patent licenses + granted to You under this License for that Work shall terminate + as of the date such litigation is filed. + + 4. Redistribution. You may reproduce and distribute copies of the + Work or Derivative Works thereof in any medium, with or without + modifications, and in Source or Object form, provided that You + meet the following conditions: + + (a) You must give any other recipients of the Work or + Derivative Works a copy of this License; and + + (b) You must cause any modified files to carry prominent notices + stating that You changed the files; and + + (c) You must retain, in the Source form of any Derivative Works + that You distribute, all copyright, patent, trademark, and + attribution notices from the Source form of the Work, + excluding those notices that do not pertain to any part of + the Derivative Works; and + + (d) If the Work includes a "NOTICE" text file as part of its + distribution, then any Derivative Works that You distribute must + include a readable copy of the attribution notices contained + within such NOTICE file, excluding those notices that do not + pertain to any part of the Derivative Works, in at least one + of the following places: within a NOTICE text file distributed + as part of the Derivative Works; within the Source form or + documentation, if provided along with the Derivative Works; or, + within a display generated by the Derivative Works, if and + wherever such third-party notices normally appear. The contents + of the NOTICE file are for informational purposes only and + do not modify the License. You may add Your own attribution + notices within Derivative Works that You distribute, alongside + or as an addendum to the NOTICE text from the Work, provided + that such additional attribution notices cannot be construed + as modifying the License. + + You may add Your own copyright statement to Your modifications and + may provide additional or different license terms and conditions + for use, reproduction, or distribution of Your modifications, or + for any such Derivative Works as a whole, provided Your use, + reproduction, and distribution of the Work otherwise complies with + the conditions stated in this License. + + 5. Submission of Contributions. 
Unless You explicitly state otherwise, + any Contribution intentionally submitted for inclusion in the Work + by You to the Licensor shall be under the terms and conditions of + this License, without any additional terms or conditions. + Notwithstanding the above, nothing herein shall supersede or modify + the terms of any separate license agreement you may have executed + with Licensor regarding such Contributions. + + 6. Trademarks. This License does not grant permission to use the trade + names, trademarks, service marks, or product names of the Licensor, + except as required for reasonable and customary use in describing the + origin of the Work and reproducing the content of the NOTICE file. + + 7. Disclaimer of Warranty. Unless required by applicable law or + agreed to in writing, Licensor provides the Work (and each + Contributor provides its Contributions) on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or + implied, including, without limitation, any warranties or conditions + of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A + PARTICULAR PURPOSE. You are solely responsible for determining the + appropriateness of using or redistributing the Work and assume any + risks associated with Your exercise of permissions under this License. + + 8. Limitation of Liability. In no event and under no legal theory, + whether in tort (including negligence), contract, or otherwise, + unless required by applicable law (such as deliberate and grossly + negligent acts) or agreed to in writing, shall any Contributor be + liable to You for damages, including any direct, indirect, special, + incidental, or consequential damages of any character arising as a + result of this License or out of the use or inability to use the + Work (including but not limited to damages for loss of goodwill, + work stoppage, computer failure or malfunction, or any and all + other commercial damages or losses), even if such Contributor + has been advised of the possibility of such damages. + + 9. Accepting Warranty or Additional Liability. While redistributing + the Work or Derivative Works thereof, You may choose to offer, + and charge a fee for, acceptance of support, warranty, indemnity, + or other liability obligations and/or rights consistent with this + License. However, in accepting such obligations, You may act only + on Your own behalf and on Your sole responsibility, not on behalf + of any other Contributor, and only if You agree to indemnify, + defend, and hold each Contributor harmless for any liability + incurred by, or claims asserted against, such Contributor by reason + of your accepting any such warranty or additional liability. + + END OF TERMS AND CONDITIONS + + APPENDIX: How to apply the Apache License to your work. + + To apply the Apache License to your work, attach the following + boilerplate notice, with the fields enclosed by brackets "[]" + replaced with your own identifying information. (Don't include + the brackets!) The text should be enclosed in the appropriate + comment syntax for the file format. We also recommend that a + file or class name and description of purpose be included on the + same "printed page" as the copyright notice for easier + identification within third-party archives. + + Copyright [yyyy] [name of copyright owner] + + Licensed under the Apache License, Version 2.0 (the "License"); + you may not use this file except in compliance with the License. 
+ You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. diff --git a/MANIFEST.in b/MANIFEST.in index 73ea9e2e8b..495d35c967 100644 --- a/MANIFEST.in +++ b/MANIFEST.in @@ -1,12 +1,13 @@ include AUTHORS LICENSE .functests .unittests .probetests test/__init__.py -include CHANGELOG README.md +include CHANGELOG CONTRIBUTING.rst README.rst include babel.cfg include test/sample.conf include tox.ini +include requirements.txt test-requirements.txt graft doc graft etc -graft locale +graft swift/locale +recursive-include swift/common/middleware/s3api/schema *.rng graft test/functional graft test/probe graft test/unit -graft tools diff --git a/README.md b/README.md deleted file mode 100644 index a839dd6fcc..0000000000 --- a/README.md +++ /dev/null @@ -1,83 +0,0 @@ -# Swift - -A distributed object storage system designed to scale from a single machine -to thousands of servers. Swift is optimized for multi-tenancy and high -concurrency. Swift is ideal for backups, web and mobile content, and any other -unstructured data that can grow without bound. - -Swift provides a simple, REST-based API fully documented at -http://doc.openstack.org/. - -Swift was originally developed as the basis for Rackspace's Cloud Files and -was open-sourced in 2010 as part of the OpenStack project. It has since grown -to include contributions from many companies and has spawned a thriving -ecosystem of 3rd party tools. Swift's contributors are listed in the AUTHORS -file. - -## Docs - -To build documentation install sphinx (`pip install sphinx`), run -`python setup.py build_sphinx`, and then browse to /doc/build/html/index.html. -These docs are auto-generated after every commit and available online at -http://docs.openstack.org/developer/swift/. - -## For Developers - -The best place to get started is the ["SAIO - Swift All In One"](http://docs.openstack.org/developer/swift/development_saio.html). -This document will walk you through setting up a development cluster of Swift -in a VM. The SAIO environment is ideal for running small-scale tests against -swift and trying out new features and bug fixes. - -You can run unit tests with `.unittests` and functional tests with -`.functests`. - -### Code Organization - - * bin/: Executable scripts that are the processes run by the deployer - * doc/: Documentation - * etc/: Sample config files - * swift/: Core code - * account/: account server - * common/: code shared by different modules - * middleware/: "standard", officially-supported middleware - * ring/: code implementing Swift's ring - * container/: container server - * obj/: object server - * proxy/: proxy server - * test/: Unit and functional tests - -### Data Flow - -Swift is a WSGI application and uses eventlet's WSGI server. After the -processes are running, the entry point for new requests is the `Application` -class in `swift/proxy/server.py`. From there, a controller is chosen, and the -request is processed. The proxy may choose to forward the request to a back- -end server. For example, the entry point for requests to the object server is -the `ObjectController` class in `swift/obj/server.py`. 
- - -## For Deployers - -Deployer docs are also available at -http://docs.openstack.org/developer/swift/. A good starting point is at -http://docs.openstack.org/developer/swift/deployment_guide.html - -You can run functional tests against a swift cluster with `.functests`. These -functional tests require `/etc/swift/test.conf` to run. A sample config file -can be found in this source tree in `test/sample.conf`. - -## For Client Apps - -For client applications, official Python language bindings are provided at -http://github.com/openstack/python-swiftclient. - -Complete API documentation at -http://docs.openstack.org/api/openstack-object-storage/1.0/content/ - ----- - -For more information come hang out in #openstack-swift on freenode. - -Thanks, - -The Swift Development Team diff --git a/README.rst b/README.rst new file mode 100644 index 0000000000..1afe2b0a37 --- /dev/null +++ b/README.rst @@ -0,0 +1,154 @@ +=============== +OpenStack Swift +=============== + +OpenStack Swift is a distributed object storage system designed to scale +from a single machine to thousands of servers. Swift is optimized for +multi-tenancy and high concurrency. Swift is ideal for backups, web and mobile +content, and any other unstructured data that can grow without bound. + +Swift provides a simple, REST-based API fully documented at +https://docs.openstack.org/swift/latest/. + +Swift was originally developed as the basis for Rackspace's Cloud Files +and was open-sourced in 2010 as part of the OpenStack project. It has +since grown to include contributions from many companies and has spawned +a thriving ecosystem of 3rd party tools. Swift's contributors are listed +in the AUTHORS file. + +Docs +---- + +To build documentation run:: + + pip install -r requirements.txt -r doc/requirements.txt + sphinx-build -W -b html doc/source doc/build/html + +and then browse to doc/build/html/index.html. These docs are auto-generated +after every commit and available online at +https://docs.openstack.org/swift/latest/. + +For Developers +-------------- + +Getting Started +~~~~~~~~~~~~~~~ + +Swift is part of OpenStack and follows the code contribution, review, and +testing processes common to all OpenStack projects. + +If you would like to start contributing, check out these +`notes `__ to help you get started. + +The best place to get started is the +`"SAIO - Swift All In One" `__. +This document will walk you through setting up a development cluster of +Swift in a VM. The SAIO environment is ideal for running small-scale +tests against Swift and trying out new features and bug fixes. + +Tests +~~~~~ + +There are three types of tests included in Swift's source tree. + +#. Unit tests +#. Functional tests +#. Probe tests + +Unit tests check that small sections of the code behave properly. For example, +a unit test may test a single function to ensure that various input gives the +expected output. This validates that the code is correct and regressions are +not introduced. + +Functional tests check that the client API is working as expected. These can +be run against any endpoint claiming to support the Swift API (although some +tests require multiple accounts with different privilege levels). These are +"black box" tests that ensure that client apps written against Swift will +continue to work. + +Probe tests are "white box" tests that validate the internal workings of a +Swift cluster. They are written to work against the +`"SAIO - Swift All In One" `__ +dev environment. 
For example, a probe test may create an object, delete one +replica, and ensure that the background consistency processes find and correct +the error. + +You can run unit tests with ``.unittests``, functional tests with +``.functests``, and probe tests with ``.probetests``. There is an +additional ``.alltests`` script that wraps the other three. + +To fully run the tests, the target environment must use a filesystem that +supports large xattrs. XFS is strongly recommended. For unit tests and in- +process functional tests, either mount ``/tmp`` with XFS or provide another +XFS filesystem via the ``TMPDIR`` environment variable. Without this setting, +tests should still pass, but a very large number will be skipped. + +Code Organization +~~~~~~~~~~~~~~~~~ + +- doc/: Documentation +- etc/: Sample config files +- examples/: Config snippets used in the docs +- swift/: Core code + + - account/: account server + - cli/: code that backs some of the CLI tools + - common/: code shared by different modules + + - middleware/: "standard", officially-supported middleware + - ring/: code implementing Swift's ring + + - container/: container server + - locale/: internationalization (translation) data + - obj/: object server + - proxy/: proxy server + +- test/: Unit, functional, and probe tests + +Data Flow +~~~~~~~~~ + +Swift is a WSGI application and uses eventlet's WSGI server. After the +processes are running, the entry point for new requests is the +``Application`` class in ``swift/proxy/server.py``. From there, a +controller is chosen, and the request is processed. The proxy may choose +to forward the request to a back-end server. For example, the entry +point for requests to the object server is the ``ObjectController`` +class in ``swift/obj/server.py``. + +For Deployers +------------- + +Deployer docs are also available at +https://docs.openstack.org/swift/latest/. A good starting point is at +https://docs.openstack.org/swift/latest/deployment_guide.html +There is an `ops runbook `__ +that gives information about how to diagnose and troubleshoot common issues +when running a Swift cluster. + +You can run functional tests against a Swift cluster with +``.functests``. These functional tests require ``/etc/swift/test.conf`` +to run. A sample config file can be found in this source tree in +``test/sample.conf``. + +For Client Apps +--------------- + +For client applications, official Python language bindings are provided +at https://opendev.org/openstack/python-swiftclient. + +Complete API documentation at +https://docs.openstack.org/api-ref/object-store/ + +There is a large ecosystem of applications and libraries that support and +work with OpenStack Swift. Several are listed on the +`associated projects `__ +page. + +-------------- + +For more information come hang out in #openstack-swift on OFTC. + +Thanks, + +The Swift Development Team diff --git a/REVIEW_GUIDELINES.rst b/REVIEW_GUIDELINES.rst new file mode 100644 index 0000000000..e2bc4c6bbb --- /dev/null +++ b/REVIEW_GUIDELINES.rst @@ -0,0 +1,390 @@ +Review Guidelines +================= + +Effective code review is a skill like any other professional skill you +develop with experience. Effective code review requires trust. No +one is perfect. Everyone makes mistakes. Trust builds over time. + +This document will enumerate behaviors commonly observed and +associated with competent reviews of changes purposed to the Swift +code base. No one is expected to "follow these steps". 
Guidelines +are not *rules*, not all behaviors will be relevant in all situations. + + Code review is collaboration, not judgement. + + -- Alistair Coles + +Checkout the Change +------------------- + +You will need to have a copy of the change in an environment where you +can freely edit and experiment with the code in order to provide a +non-superficial review. Superficial reviews are not terribly helpful. +Always try to be helpful. ;) + +Check out the change so that you may begin. + +Commonly, ``git review -d `` + +Run it +------ + +Imagine that you submit a patch to Swift, and a reviewer starts to +take a look at it. Your commit message on the patch claims that it +fixes a bug or adds a feature, but as soon as the reviewer downloads +it locally and tries to test it, a severe and obvious error shows up. +Something like a syntax error or a missing dependency. + +"Did you even run this?" is the review comment all contributors dread. + +Reviewers in particular need to be fearful merging changes that just +don't work - or at least fail in frequently common enough scenarios to +be considered "horribly broken". A comment in our review that says +roughly "I ran this on my machine and observed ``description of +behavior change is supposed to achieve``" is the most powerful defense +we have against the terrible scorn from our fellow Swift developers +and operators when we accidentally merge bad code. + +If you're doing a fair amount of reviews - you will participate in +merging a change that will break my clusters - it's cool - I'll do it +to you at some point too (sorry about that). But when either of us go +look at the reviews to understand the process gap that allowed this to +happen - it better not be just because we were too lazy to check it out +and run it before it got merged. + +Or be warned, you may receive, the dreaded... + + "Did you even *run* this?" + +I'm sorry, I know it's rough. ;) + +Consider edge cases very seriously +---------------------------------- + + Saying "that should rarely happen" is the same as saying "that + *will* happen" + + -- Douglas Crockford + +Scale is an *amazingly* abusive partner. If you contribute changes to +Swift your code is running - in production - at scale - and your bugs +cannot hide. I wish on all of us that our bugs may be exceptionally +rare - meaning they only happen in extremely unlikely edge cases. For +example, bad things that happen only 1 out of every 10K times an op is +performed will be discovered in minutes. Bad things that happen only +1 out of every one billion times something happens will be observed - +by multiple deployments - over the course of a release. Bad things +that happen 1/100 times some op is performed are considered "horribly +broken". Tests must exhaustively exercise possible scenarios. Every +system call and network connection will raise an error and timeout - +where will that Exception be caught? + +Run the tests +------------- + +Yes, I know Gerrit does this already. You can do it *too*. You might +not need to re-run *all* the tests on your machine - it depends on the +change. But, if you're not sure which will be most useful - running +all of them best - unit - functional - probe. If you can't reliably +get all tests passing in your development environment you will not be +able to do effective reviews. 
Whatever tests/suites you are able to +exercise/validate on your machine against your config you should +mention in your review comments so that other reviewers might choose +to do *other* testing locally when they have the change checked out. + +e.g. + + I went ahead and ran probe/test_object_metadata_replication.py on + my machine with both sync_method = rsync and sync_method = ssync - + that works for me - but I didn't try it with object_post_as_copy = + false + +Maintainable Code is Obvious +---------------------------- + +Style is an important component to review. The goal is maintainability. + +However, keep in mind that generally style, readability and +maintainability are orthogonal to the suitability of a change for +merge. A critical bug fix may be a well written pythonic masterpiece +of style - or it may be a hack-y ugly mess that will absolutely need +to be cleaned up at some point - but it absolutely should merge +because: CRITICAL. BUG. FIX. + +You should comment inline to praise code that is "obvious". You should +comment inline to highlight code that you found to be "obfuscated". + +Unfortunately "readability" is often subjective. We should remember +that it's probably just our own personal preference. Rather than a +comment that says "You should use a list comprehension here" - rewrite +the code as a list comprehension, run the specific tests that hit the +relevant section to validate your code is correct, then leave a +comment that says: + + I find this more readable: + + ``diff with working tested code`` + +If the author (or another reviewer) agrees - it's possible the change will get +updated to include that improvement before it is merged; or it may happen in a +follow-up change. + +However, remember that style is non-material - it is useful to provide (via +diff) suggestions to improve maintainability as part of your review - but if +the suggestion is functionally equivalent - it is by definition optional. + +Commit Messages +--------------- + +Read the commit message thoroughly before you begin the review. + +Commit messages must answer the "why" and the "what for" - more so +than the "how" or "what it does". Commonly this will take the form of +a short description: + +- What is broken - without this change +- What is impossible to do with Swift - without this change +- What is slower/worse/harder - without this change + +If you're not able to discern why a change is being made or how it +would be used - you may have to ask for more details before you can +successfully review it. + +Commit messages need to have a high consistent quality. While many +things under source control can be fixed and improved in a follow-up +change - commit messages are forever. Luckily it's easy to fix minor +mistakes using the in-line edit feature in Gerrit! If you can avoid +ever having to *ask* someone to change a commit message you will find +yourself an amazingly happier and more productive reviewer. + +Also commit messages should follow the OpenStack Commit Message +guidelines, including references to relevant impact tags or bug +numbers. You should hand out links to the OpenStack Commit Message +guidelines *liberally* via comments when fixing commit messages during +review. + +Here you go: `GitCommitMessages `_ + +New Tests +--------- + +New tests should be added for all code changes. Historically you +should expect good changes to have a diff line count ratio of at least +2:1 tests to code. 
Even if a change has to "fix" a lot of *existing* +tests, if a change does not include any *new* tests it probably should +not merge. + +If a change includes a good ratio of test changes and adds new tests - +you should say so in your review comments. + +If it does not - you should write some! + +... and offer them to the patch author as a diff indicating to them that +"something" like these tests I'm providing as an example will *need* to be +included in this change before it is suitable to merge. Bonus points if you +include suggestions for the author as to how they might improve or expand upon +the tests stubs you provide. + +Be *very* careful about asking an author to add a test for a "small change" +before attempting to do so yourself. It's quite possible there is a lack of +existing test infrastructure needed to develop a concise and clear test - the +author of a small change may not be the best person to introduce a large +amount of new test infrastructure. Also, most of the time remember it's +*harder* to write the test than the change - if the author is unable to +develop a test for their change on their own you may prevent a useful change +from being merged. At a minimum you should suggest a specific unit test that +you think they should be able to copy and modify to exercise the behavior in +their change. If you're not sure if such a test exists - replace their change +with an Exception and run tests until you find one that blows up. + +Documentation +------------- + +Most changes should include documentation. New functions and code +should have Docstrings. Tests should obviate new or changed behaviors +with descriptive and meaningful phrases. New features should include +changes to the documentation tree. New config options should be +documented in example configs. The commit message should document the +change for the change log. + +Always point out typos or grammar mistakes when you see them in +review, but also consider that if you were able to recognize the +intent of the statement - documentation with typos may be easier to +iterate and improve on than nothing. + +If a change does not have adequate documentation it may not be suitable to +merge. If a change includes incorrect or misleading documentation or is +contrary to *existing* documentation is probably is not suitable to merge. + +Every change could have better documentation. + +Like with tests, a patch isn't done until it has docs. Any patch that +adds a new feature, changes behavior, updates configs, or in any other +way is different than previous behavior requires docs. manpages, +sample configs, docstrings, descriptive prose in the source tree, etc. + +Reviewers Write Code +-------------------- + +Reviews have been shown to provide many benefits - one of which is shared +ownership. After providing a positive review you should understand how the +change works. Doing this will probably require you to "play with" the change. + +You might functionally test the change in various scenarios. You may need to +write a new unit test to validate the change will degrade gracefully under +failure. You might have to write a script to exercise the change under some +superficial load. You might have to break the change and validate the new +tests fail and provide useful errors. You might have to step through some +critical section of the code in a debugger to understand when all the possible +branches are exercised in tests. 
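As a concrete version of the "offer them as a diff" advice above, the kind of self-contained test stub a reviewer might attach in a comment could look like the following; the function and the behavior it checks are invented stand-ins, not anything in the Swift tree::

    import unittest


    def frobnicate(offset):
        # Invented stand-in for the function under review; swap in the
        # real import and the edge case the change is supposed to handle.
        if offset < 0:
            raise ValueError("offset must be non-negative")
        return offset


    class TestFrobnicate(unittest.TestCase):
        def test_rejects_negative_offsets(self):
            with self.assertRaises(ValueError):
                frobnicate(-1)

        def test_passes_through_valid_offsets(self):
            self.assertEqual(frobnicate(7), 7)


    if __name__ == "__main__":
        unittest.main()

Handing the author something they can copy, adapt, and run is usually far more productive than asking them to guess what you had in mind.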
+ +When you're done with your review an artifact of your effort will be +observable in the piles of code and scripts and diffs you wrote while +reviewing. You should make sure to capture those artifacts in a paste +or gist and include them in your review comments so that others may +reference them. + +e.g. + + When I broke the change like this: + + ``diff`` + + it blew up like this: + + ``unit test failure`` + + +It's not uncommon that a review takes more time than writing a change - +hopefully the author also spent as much time as you did *validating* their +change but that's not really in your control. When you provide a positive +review you should be sure you understand the change - even seemingly trivial +changes will take time to consider the ramifications. + +Leave Comments +-------------- + +Leave. Lots. Of. Comments. + +A popular web comic has stated that +`WTFs/Minute `_ is the +*only* valid measurement of code quality. + +If something initially strikes you as questionable - you should jot +down a note so you can loop back around to it. + +However, because of the distributed nature of authors and reviewers +it's *imperative* that you try your best to answer your own questions +as part of your review. + +Do not say "Does this blow up if it gets called when xyz" - rather try +and find a test that specifically covers that condition and mention it +in the comment so others can find it more quickly. Or if you can find +no such test, add one to demonstrate the failure, and include a diff +in a comment. Hopefully you can say "I *thought* this would blow up, +so I wrote this test, but it seems fine." + +But if your initial reaction is "I don't understand this" or "How does +this even work?" you should notate it and explain whatever you *were* +able to figure out in order to help subsequent reviewers more quickly +identify and grok the subtle or complex issues. + +Because you will be leaving lots of comments - many of which are +potentially not highlighting anything specific - it is VERY important +to leave a good summary. Your summary should include details of how +you reviewed the change. You may include what you liked most, or +least. + +If you are leaving a negative score ideally you should provide clear +instructions on how the change could be modified such that it would be +suitable for merge - again diffs work best. + +Scoring +------- + +Scoring is subjective. Try to realize you're making a judgment call. + +A positive score means you believe Swift would be undeniably better +off with this code merged than it would be going one more second +without this change running in production immediately. It is indeed +high praise - you should be sure. + +A negative score means that to the best of your abilities you have not +been able to your satisfaction, to justify the value of a change +against the cost of its deficiencies and risks. It is a surprisingly +difficult chore to be confident about the value of unproven code or a +not well understood use-case in an uncertain world, and unfortunately +all too easy with a **thorough** review to uncover our defects, and be +reminded of the risk of... regression. + +Reviewers must try *very* hard first and foremost to keep master stable. + +If you can demonstrate a change has an incorrect *behavior* it's +almost without exception that the change must be revised to fix the +defect *before* merging rather than letting it in and having to also +file a bug. + +Every commit must be deployable to production. 
+ +Beyond that - almost any change might be merge-able depending on +its merits! Here are some tips you might be able to use to find more +changes that should merge! + +#. Fixing bugs is HUGELY valuable - the *only* thing which has a + higher cost than the value of fixing a bug - is adding a new + bug - if it's broken and this change makes it fixed (without + breaking anything else) you have a winner! + +#. Features are INCREDIBLY difficult to justify their value against + the cost of increased complexity, lowered maintainability, risk + of regression, or new defects. Try to focus on what is + *impossible* without the feature - when you make the impossible + possible, things are better. Make things better. + +#. Purely test/doc changes, complex refactoring, or mechanical + cleanups are quite nuanced because there's less concrete + objective value. I've seen lots of these kind of changes + get lost to the backlog. I've also seen some success where + multiple authors have collaborated to "push-over" a change + rather than provide a "review" ultimately resulting in a + quorum of three or more "authors" who all agree there is a lot + of value in the change - however subjective. + +Because the bar is high - most reviews will end with a negative score. + +However, for non-material grievances (nits) - you should feel +confident in a positive review if the change is otherwise complete +correct and undeniably makes Swift better (not perfect, *better*). If +you see something worth fixing you should point it out in review +comments, but when applying a score consider if it *need* be fixed +before the change is suitable to merge vs. fixing it in a follow up +change? Consider if the change makes Swift so undeniably *better* +and it was deployed in production without making any additional +changes would it still be correct and complete? Would releasing the +change to production without any additional follow up make it more +difficult to maintain and continue to improve Swift? + +Endeavor to leave a positive or negative score on every change you review. + +Use your best judgment. + +A note on Swift Core Maintainers +-------------------------------- + +Swift Core maintainers may provide positive reviews scores that *look* +different from your reviews - a "+2" instead of a "+1". + +But it's *exactly the same* as your "+1". + +It means the change has been thoroughly and positively reviewed. The +only reason it's different is to help identify changes which have +received multiple competent and positive reviews. If you consistently +provide competent reviews you run a *VERY* high risk of being +approached to have your future positive review scores changed from a +"+1" to "+2" in order to make it easier to identify changes which need +to get merged. + +Ideally a review from a core maintainer should provide a clear path +forward for the patch author. If you don't know how to proceed +respond to the reviewers comments on the change and ask for help. +We'd love to try and help. diff --git a/api-ref/source/conf.py b/api-ref/source/conf.py new file mode 100644 index 0000000000..dea25e9c7b --- /dev/null +++ b/api-ref/source/conf.py @@ -0,0 +1,210 @@ +# -*- coding: utf-8 -*- +# +# Licensed under the Apache License, Version 2.0 (the "License"); you may +# not use this file except in compliance with the License. 
You may obtain +# a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT +# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the +# License for the specific language governing permissions and limitations +# under the License. +# +# swift documentation build configuration file +# +# This file is execfile()d with the current directory set to +# its containing dir. +# +# Note that not all possible configuration values are present in this +# autogenerated file. +# +# All configuration values have a default; values that are commented out +# serve to show the default. + +import datetime +import os +import sys +import warnings + + +html_theme = 'openstackdocs' +html_theme_options = { + "sidebar_mode": "toc", +} + +extensions = [ + 'os_api_ref', + 'openstackdocstheme' +] + +# If extensions (or modules to document with autodoc) are in another directory, +# add these directories to sys.path here. If the directory is relative to the +# documentation root, use os.path.abspath to make it absolute, like shown here. +sys.path.insert(0, os.path.abspath('../../')) +sys.path.insert(0, os.path.abspath('../')) +sys.path.insert(0, os.path.abspath('./')) + +# -- General configuration ---------------------------------------------------- + +# Add any Sphinx extension module names here, as strings. They can be +# extensions coming with Sphinx (named 'sphinx.ext.*') or your custom ones. + +# The suffix of source filenames. +source_suffix = '.rst' + +# The encoding of source files. +# +# source_encoding = 'utf-8' + +# The master toctree document. +master_doc = 'index' + +# General information about the project. +project = u'Object Storage API Reference' +copyright = u'2010-present, OpenStack Foundation' + +# The language for content autogenerated by Sphinx. Refer to documentation +# for a list of supported languages. +# +# language = None + +# There are two options for replacing |today|: either, you set today to some +# non-false value, then it is used: +# today = '' +# Else, today_fmt is used as the format for a strftime call. +# today_fmt = '%B %d, %Y' + +# The reST default role (used for this markup: `text`) to use +# for all documents. +# default_role = None + +# If true, '()' will be appended to :func: etc. cross-reference text. +# add_function_parentheses = True + +# If true, the current module name will be prepended to all description +# unit titles (such as .. function::). +add_module_names = False + +# If true, sectionauthor and moduleauthor directives will be shown in the +# output. They are ignored by default. +show_authors = False + +# The name of the Pygments (syntax highlighting) style to use. +pygments_style = 'native' + +# openstackdocstheme options +openstackdocs_repo_name = 'openstack/swift' +openstackdocs_bug_project = 'swift' +openstackdocs_bug_tag = 'api-ref' + +# -- Options for man page output ---------------------------------------------- + +# Grouping the document tree for man pages. +# List of tuples 'sourcefile', 'target', u'title', u'Authors name', 'manual' + + +# -- Options for HTML output -------------------------------------------------- + +# The theme to use for HTML and HTML Help pages. Major themes that come with +# Sphinx are currently 'default' and 'sphinxdoc'. 
+# html_theme_path = ["."] +# html_theme = '_theme' + +# Theme options are theme-specific and customize the look and feel of a theme +# further. For a list of options available for each theme, see the +# documentation. +# html_theme_options = {} + +# Add any paths that contain custom themes here, relative to this directory. +# html_theme_path = [] + +# The name for this set of Sphinx documents. If None, it defaults to +# " v documentation". +# html_title = None + +# A shorter title for the navigation bar. Default is the same as html_title. +# html_short_title = None + +# The name of an image file (relative to this directory) to place at the top +# of the sidebar. +# html_logo = None + +# The name of an image file (within the static path) to use as favicon of the +# docs. This file should be a Windows icon file (.ico) being 16x16 or 32x32 +# pixels large. +# html_favicon = None + +# Add any paths that contain custom static files (such as style sheets) here, +# relative to this directory. They are copied after the builtin static files, +# so a file named "default.css" will overwrite the builtin "default.css". +# html_static_path = ['_static'] + +# If true, SmartyPants will be used to convert quotes and dashes to +# typographically correct entities. +# html_use_smartypants = True + +# Custom sidebar templates, maps document names to template names. +# html_sidebars = {} + +# Additional templates that should be rendered to pages, maps page names to +# template names. +# html_additional_pages = {} + +# If false, no module index is generated. +# html_use_modindex = True + +# If false, no index is generated. +# html_use_index = True + +# If true, the index is split into individual pages for each letter. +# html_split_index = False + +# If true, links to the reST sources are added to the pages. +# html_show_sourcelink = True + +# If true, an OpenSearch description file will be output, and all pages will +# contain a tag referring to it. The value of this option must be the +# base URL from which the finished HTML is served. +# html_use_opensearch = '' + +# If nonempty, this is the file name suffix for HTML files (e.g. ".xhtml"). +# html_file_suffix = '' + +# Output file base name for HTML help builder. +htmlhelp_basename = 'swiftdoc' + + +# -- Options for LaTeX output ------------------------------------------------- + +# The paper size ('letter' or 'a4'). +# latex_paper_size = 'letter' + +# The font size ('10pt', '11pt' or '12pt'). +# latex_font_size = '10pt' + +# Grouping the document tree into LaTeX files. List of tuples +# (source start file, target name, title, author, documentclass +# [howto/manual]). +latex_documents = [ + ('index', 'swift.tex', u'OpenStack Object Storage API Documentation', + u'OpenStack Foundation', 'manual'), +] + +# The name of an image file (relative to this directory) to place at the top of +# the title page. +# latex_logo = None + +# For "manual" documents, if this is true, then toplevel headings are parts, +# not chapters. +# latex_use_parts = False + +# Additional stuff for the LaTeX preamble. +# latex_preamble = '' + +# Documents to append as an appendix to all manuals. +# latex_appendices = [] + +# If false, no module index is generated. +# latex_use_modindex = True diff --git a/api-ref/source/index.rst b/api-ref/source/index.rst new file mode 100644 index 0000000000..22f40d575c --- /dev/null +++ b/api-ref/source/index.rst @@ -0,0 +1,15 @@ +:tocdepth: 2 + +=================== + Object Storage API +=================== + +.. rest_expand_all:: + +.. 
include:: storage_info.inc +.. include:: storage-account-services.inc +.. include:: storage-container-services.inc +.. include:: storage-object-services.inc +.. include:: storage_endpoints.inc + + diff --git a/api-ref/source/metadata_header_encoding.inc b/api-ref/source/metadata_header_encoding.inc new file mode 100644 index 0000000000..1aee47bf83 --- /dev/null +++ b/api-ref/source/metadata_header_encoding.inc @@ -0,0 +1,6 @@ +.. note:: + + The metadata value must be UTF-8-encoded and then + URL-encoded before you include it in the header. + This is a direct violation of the HTTP/1.1 `basic rules + `_. diff --git a/api-ref/source/metadata_header_syntax.inc b/api-ref/source/metadata_header_syntax.inc new file mode 100644 index 0000000000..771f99dfcf --- /dev/null +++ b/api-ref/source/metadata_header_syntax.inc @@ -0,0 +1,7 @@ +.. note:: + + Metadata keys (the name of the metadata) must be treated as case-insensitive + at all times. These keys can contain ASCII 7-bit characters that are not + control (0-31) characters, DEL, or a separator character, according to + `HTTP/1.1 `_ . + The underscore character is silently converted to a hyphen. diff --git a/api-ref/source/parameters.yaml b/api-ref/source/parameters.yaml new file mode 100644 index 0000000000..01952f58f4 --- /dev/null +++ b/api-ref/source/parameters.yaml @@ -0,0 +1,1270 @@ +# variables in header +Accept: + description: | + Instead of using the ``format`` query parameter, + set this header to ``application/json``, ``application/xml``, or + ``text/xml``. + in: header + required: false + type: string +Accept-Ranges: + description: | + The type of ranges that the object accepts. + in: header + required: true + type: string +Content-Disposition: + description: | + If set, specifies the override behavior for the + browser. For example, this header might specify that the browser + use a download program to save this file rather than show the + file, which is the default. + in: header + required: false + type: string +Content-Disposition_resp: + description: | + If present, specifies the override behavior for the + browser. For example, this header might specify that the browser + use a download program to save this file rather than show the + file, which is the default. If not set, this header is not + returned by this operation. + in: header + required: false + type: string +Content-Encoding: + description: | + If set, the value of the ``Content-Encoding`` + metadata. + in: header + required: false + type: string +Content-Encoding_resp: + description: | + If present, the value of the ``Content-Encoding`` + metadata. If not set, the operation does not return this header. + in: header + required: false + type: string +Content-Length_cud_resp: + description: | + If the operation succeeds, this value is zero + (0) or the length of informational or error + text in the response body. + in: header + required: true + type: string +Content-Length_get_resp: + description: | + The length of the object content in the response + body, in bytes. + in: header + required: true + type: string +Content-Length_listing_resp: + description: | + If the operation succeeds, the length of the response body + in bytes. On error, this is the length of the error text. + in: header + required: true + type: string +Content-Length_obj_head_resp: + description: | + HEAD operations do not return content. The + ``Content-Length`` header value is not the size of the response + body but is the size of the object, in bytes. 
+ in: header + required: true + type: string +Content-Length_put_req: + description: | + Set to the length of the object content (i.e. the length in bytes + of the request body). Do not + set if chunked transfer encoding is being used. + in: header + required: false + type: integer +Content-Type_cud_resp: + description: | + If present, this value is the MIME + type of the informational or error text in the response body. + in: header + required: false + type: string +Content-Type_listing_resp: + description: | + If the operation succeeds, this value is the MIME type of the list + response. The MIME type is determined by the listing format specified by + the request and will be one of ``text/plain``, ``application/json``, + ``application/xml``, or ``text/xml``. If the operation fails, this value is + the MIME type of the error text in the response body. + in: header + required: true + type: string +Content-Type_obj_cu_req: + description: | + Sets the MIME type for the object. + in: header + required: false + type: string +Content-Type_obj_resp: + description: | + If the operation succeeds, this value is the MIME type of the object. If + the operation fails, this value is the MIME type of the error text in the + response body. + in: header + required: true + type: string +Date: + description: | + The date and time the system responded to the request, + using the preferred format of + `RFC 7231 `_ as + shown in this example ``Thu, 16 Jun 2016 15:10:38 GMT``. The time is + always in UTC. + in: header + required: true + type: string +Destination: + description: | + The container and object name of the destination + object in the form of ``/container/object``. You must UTF-8-encode + and then URL-encode the names of the destination container and + object before you include them in this header. + in: header + required: true + type: string +Destination-Account: + description: | + Specifies the account name where the object is copied to. If not + specified, the object is copied to the account which owns the object + (i.e., the account in the path). + in: header + required: false + type: string +ETag_obj_copied: + description: | + The MD5 checksum of the copied object content. + The value is not quoted. + in: header + required: true + type: string +ETag_obj_received: + description: | + The MD5 checksum of the uploaded object content. + The value is not quoted. If it is an SLO, it would + be MD5 checksum of the segments' etags. + in: header + required: true + type: string +ETag_obj_req: + description: | + The MD5 checksum value of the request body. For + example, the MD5 checksum value of the object content. For + manifest objects, this value is the MD5 checksum of the + concatenated string of ETag values for each of the segments in + the manifest. You are strongly recommended to compute + the MD5 checksum value and include it in the request. This + enables the Object Storage API to check the integrity of the + upload. The value is not quoted. + in: header + required: false + type: string +ETag_obj_resp: + description: | + For objects smaller than 5 GB, this value is the + MD5 checksum of the object content. The value is not quoted. For + manifest objects, this value is the MD5 checksum of the + concatenated string of ETag values for each of the + segments in the manifest, and not the MD5 checksum of the content + that was downloaded. Also the value is enclosed in double-quote + characters. 
You are strongly recommended to compute the MD5 + checksum of the response body as it is received and compare this + value with the one in the ETag header. If they differ, the content + was corrupted, so retry the operation. + in: header + required: true + type: string +If-Match: + description: | + See `Request for Comments: 2616 + `_. + in: header + required: false + type: string +If-Modified-Since: + description: | + See `Request for Comments: 2616 + `_. + in: header + required: false + type: string +If-None-Match-get-request: + description: | + A client that has one or more entities previously + obtained from the resource can verify that none of those entities is + current by including a list of their associated entity tags in the + ``If-None-Match header`` field. + See `Request for Comments: 2616 `_ + for details. + in: header + required: false + type: string +If-None-Match-put-request: + description: | + In combination with ``Expect: 100-Continue``, + specify an ``"If-None-Match: *"`` header to query whether the + server already has a copy of the object before any data is sent. + in: header + required: false + type: string +If-Unmodified-Since: + description: | + See `Request for Comments: 2616 + `_. + in: header + required: false + type: string +Last-Modified: + description: | + The date and time when the object was created or its metadata was + changed. The date and time is formatted as shown in this + example: ``Fri, 12 Aug 2016 14:24:16 GMT`` + + The time is always in UTC. + in: header + required: true + type: string +Range: + description: | + The ranges of content to get. You can use the + ``Range`` header to get portions of data by using one or more + range specifications. To specify many ranges, separate the range + specifications with a comma. The types of range specifications + are: - **Byte range specification**. Use FIRST_BYTE_OFFSET to + specify the start of the data range, and LAST_BYTE_OFFSET to + specify the end. You can omit the LAST_BYTE_OFFSET and if you + do, the value defaults to the offset of the last byte of data. + - **Suffix byte range specification**. Use LENGTH bytes to specify + the length of the data range. The following forms of the header + specify the following ranges of data: + + - ``Range: bytes=-5``. The last five bytes. + - ``Range: bytes=10-15``. The six bytes of data after a 10-byte offset. + - ``Range: bytes=10-15,-5``. A multi-part response that contains the + last five bytes and the six + bytes of data after a 10-byte offset. The ``Content-Type`` + response header contains ``multipart/byteranges``. + - ``Range: bytes=4-6``. Bytes 4 to 6 inclusive. + - ``Range: bytes=2-2``. Byte 2, the third byte of the data. + - ``Range: bytes=6-``. Byte 6 and after. + - ``Range: bytes=1-3,2-5``. A multi-part response that + contains bytes 1 to 3 inclusive, and bytes 2 to 5 inclusive. The + ``Content-Type`` response header contains + ``multipart/byteranges``. + in: header + required: false + type: string +Transfer-Encoding: + description: | + Set to ``chunked`` to enable chunked transfer + encoding. If used, do not set the ``Content-Length`` header to a + non-zero value. + in: header + required: false + type: string +X-Account-Access-Control_req: + description: | + **Note**: `X-Account-Access-Control` is not supported by Keystone auth. + + Sets an account access control list (ACL) that grants access to + containers and objects in the account. + See `Account ACLs + `_ + for more information. 
+ in: header + required: false + type: string +X-Account-Access-Control_resp: + description: | + **Note**: `X-Account-Access-Control` is not supported by Keystone auth. + + The account access control list (ACL) that grants access to + containers and objects in the account. + If there is no ACL, this header is not returned by this operation. + See `Account ACLs + `_ + for more information. + in: header + required: false + type: string +X-Account-Bytes-Used: + description: | + The total number of bytes that are stored in + Object Storage for the account. + in: header + required: true + type: integer +X-Account-Container-Count: + description: | + The number of containers. + in: header + required: true + type: integer +X-Account-Meta-name: + description: | + The custom account metadata item, where + ``name`` is the name of the metadata item. One ``X-Account-Meta-name`` + response header appears for each metadata item (for + each ``name``). + in: header + required: false + type: string +X-Account-Meta-name_req: + description: | + The account metadata. The ``name`` is the name + of metadata item that you want to add, update, or delete. To + delete this item, send an empty value in this header. You must + specify an ``X-Account-Meta-name`` header for each metadata + item (for each ``name``) that you want to add, update, or + delete. + in: header + required: false + type: string +X-Account-Meta-Quota-Bytes_resp: + description: | + If present, this is the limit on the total size in bytes of objects stored + in the account. + Typically this value is set by an administrator. + in: header + required: false + type: string +X-Account-Meta-Temp-URL-Key-2_req: + description: | + A second secret key value for temporary URLs. + The second key enables you to rotate keys by having + two active keys at the same time. + in: header + required: false + type: string +X-Account-Meta-Temp-URL-Key-2_resp: + description: | + The second secret key value for temporary URLs. If + not set, this header is not returned in the response. + in: header + required: false + type: string +X-Account-Meta-Temp-URL-Key_req: + description: | + The secret key value for temporary URLs. + in: header + required: false + type: string +X-Account-Meta-Temp-URL-Key_resp: + description: | + The secret key value for temporary URLs. If not + set, this header is not returned in the response. + in: header + required: false + type: string +X-Account-Object-Count: + description: | + The number of objects in the account. + in: header + required: true + type: integer +X-Account-Storage-Policy-name-Bytes-Used: + description: | + The total number of bytes that are stored in + in a given storage policy, where ``name`` is the + name of the storage policy. + in: header + required: true + type: integer +X-Account-Storage-Policy-name-Container-Count: + description: | + The number of containers in the account that use the given + storage policy where ``name`` is the name of the storage policy. + in: header + required: true + type: integer +X-Account-Storage-Policy-name-Object-Count: + description: | + The number of objects in given storage policy where ``name`` is + the name of the storage policy. + in: header + required: true + type: integer +X-Auth-Token: + description: | + Authentication token. If you omit this header, + your request fails unless the account owner has granted you access + through an access control list (ACL). + in: header + required: false + type: string +X-Container-Bytes-Used: + description: | + The total number of bytes used. 
+ in: header + required: true + type: integer +X-Container-Meta-Access-Control-Allow-Origin: + description: | + Originating URLs allowed to make cross-origin + requests (CORS), separated by spaces. This heading applies to the + container only, and all objects within the container with this + header applied are CORS-enabled for the allowed origin URLs. A + browser (user-agent) typically issues a `preflighted request + `_ , which is an OPTIONS call + that verifies the origin is allowed to make the request. The + Object Storage service returns 200 if the originating URL is + listed in this header parameter, and issues a 401 if the + originating URL is not allowed to make a cross-origin request. + Once a 200 is returned, the browser makes a second request to the + Object Storage service to retrieve the CORS-enabled object. + in: header + required: false + type: string +X-Container-Meta-Access-Control-Expose-Headers: + description: | + Headers the Object Storage service exposes to the + browser (technically, through the ``user-agent`` setting), in the + request response, separated by spaces. By default the Object + Storage service returns the following headers: + + - All "simple response headers" as listed on + `http://www.w3.org/TR/cors/#simple-response-header + `_. + - The headers ``etag``, ``x-timestamp``, ``x-trans-id``, + ``x-openstack-request-id``. + - All metadata headers (``X-Container-Meta-*`` for containers and + ``X-Object-Meta-*`` for objects). + - headers listed in ``X-Container-Meta-Access-Control-Expose-Headers``. + in: header + required: false + type: string +X-Container-Meta-Access-Control-Max-Age: + description: | + Maximum time for the origin to hold the preflight + results. A browser may make an OPTIONS call to verify the origin + is allowed to make the request. Set the value to an integer number + of seconds after the time that the request was received. + in: header + required: false + type: string +X-Container-Meta-name: + description: | + The custom container metadata item, where + ``name`` is the name of the metadata item. One ``X-Container-Meta-name`` + response header appears for each metadata item (for + each ``name``). + in: header + required: true + type: string +X-Container-Meta-name_req: + description: | + The container metadata, where ``name`` is the + name of metadata item. You must specify an ``X-Container-Meta-name`` + header for each metadata item (for each ``name``) that + you want to add or update. + in: header + required: false + type: string +X-Container-Meta-Quota-Bytes: + description: | + Sets maximum size of the container, in bytes. + Typically these values are set by an administrator. Returns a 413 + response (request entity too large) when an object PUT operation + exceeds this quota value. + This value does not take effect immediately. see + `Container Quotas + `_ + for more information. + in: header + required: false + type: string +X-Container-Meta-Quota-Bytes_resp: + description: | + The maximum size of the container, in bytes. If not set, this header is not + returned by this operation. + in: header + required: false + type: string +X-Container-Meta-Quota-Count: + description: | + Sets maximum object count of the container. + Typically these values are set by an administrator. Returns a 413 + response (request entity too large) when an object PUT operation + exceeds this quota value. + This value does not take effect immediately. see + `Container Quotas + `_ + for more information. 
+ in: header + required: false + type: string +X-Container-Meta-Quota-Count_resp: + description: | + The maximum object count of the container. If not set, this header is not + returned by this operation. + in: header + required: false + type: string +X-Container-Meta-Temp-URL-Key-2_req: + description: | + A second secret key value for temporary URLs. + The second key enables you to rotate keys by having + two active keys at the same time. + in: header + required: false + type: string +X-Container-Meta-Temp-URL-Key-2_resp: + description: | + The second secret key value for temporary URLs. If + not set, this header is not returned in the response. + in: header + required: false + type: string +X-Container-Meta-Temp-URL-Key_req: + description: | + The secret key value for temporary URLs. + in: header + required: false + type: string +X-Container-Meta-Temp-URL-Key_resp: + description: | + The secret key value for temporary URLs. If not + set, this header is not returned in the response. + in: header + required: false + type: string +X-Container-Meta-Web-Directory-Type: + description: | + Sets the content-type of directory marker + objects. If the header is not set, default is + ``application/directory``. Directory marker objects are 0-byte + objects that represent directories to create a simulated + hierarchical structure. For example, if you set ``"X-Container- + Meta-Web-Directory-Type: text/directory"``, Object Storage treats + 0-byte objects with a content-type of ``text/directory`` as + directories rather than objects. + in: header + required: false + type: string +X-Container-Object-Count: + description: | + The number of objects. + in: header + required: true + type: integer +X-Container-Read: + description: | + Sets a container access control list (ACL) that grants read access. + The scope of the access is specific to the container. The ACL grants + the ability to perform GET or HEAD operations on objects in the container + or to perform a GET or HEAD operation on the container itself. + + The format and scope of the ACL is dependent on the authorization system + used by the Object Storage service. See `Container ACLs + `_ + for more information. + in: header + required: false + type: string +X-Container-Read_resp: + description: | + The ACL that grants read access. If there is no ACL, this + header is not returned by this operation. + See `Container ACLs + `_ + for more information. + in: header + required: false + type: string +X-Container-Sync-Key: + description: | + Sets the secret key for container + synchronization. If you remove the secret key, synchronization is + halted. + For more information, see `Container to Container Synchronization + `_ + in: header + required: false + type: string +X-Container-Sync-Key_resp: + description: | + The secret key for container synchronization. If + not set, this header is not returned by this operation. + in: header + required: false + type: string +X-Container-Sync-To: + description: | + Sets the destination for container + synchronization. Used with the secret key indicated in the ``X + -Container-Sync-Key`` header. If you want to stop a container from + synchronizing, send a blank value for the ``X-Container-Sync-Key`` + header. + in: header + required: false + type: string +X-Container-Sync-To_resp: + description: | + The destination for container synchronization. If + not set, this header is not returned by this operation. 
+ in: header + required: false + type: string +X-Container-Write: + description: | + Sets a container access control list (ACL) that grants write access. + The scope of the access is specific to the container. The ACL grants + the ability to perform PUT, POST and DELETE operations on + objects in the container. It does not grant write access to the container + metadata. + + The format of the ACL is dependent on the authorization system + used by the Object Storage service. See `Container ACLs + `_ + for more information. + + in: header + required: false + type: string +X-Container-Write_resp: + description: + The ACL that grants write access. If there is no ACL, + this header is not returned by this operation. + See `Container ACLs + `_ + for more information. + in: header + required: false + type: string +X-Copied-From: + description: | + For a copied object, shows the container and + object name from which the new object was copied. The value is in + the ``{container}/{object}`` format. + in: header + required: false + type: string +X-Copied-From-Account: + description: | + For a copied object, shows the account + from which the new object was copied. + in: header + required: false + type: string +X-Copied-From-Last-Modified: + description: | + For a copied object, the date and time in `UNIX + Epoch time stamp format + `_ when the container and + object name from which the new object was copied was last + modified. For example, ``1440619048`` is equivalent to ``Mon, + Wed, 26 Aug 2015 19:57:28 GMT``. + in: header + required: false + type: integer +X-Copy-From: + description: | + If set, this is the name of an object used to + create the new object by copying the ``X-Copy-From`` object. The + value is in form ``{container}/{object}``. You must UTF-8-encode + and then URL-encode the names of the container and object before + you include them in the header. Using PUT with ``X-Copy-From`` + has the same effect as using the COPY operation to copy an object. + Using ``Range`` header with ``X-Copy-From`` will create a new + partial copied object with bytes set by ``Range``. + in: header + required: false + type: string +X-Copy-From-Account: + description: | + Specifies the account name where the object is copied from. If not + specified, the object is copied from the account which owns the new + object (i.e., the account in the path). + in: header + required: false + type: string +X-Delete-After: + description: | + The number of seconds after which the system removes the object. The value + should be a positive integer. Internally, the Object Storage system uses + this value to generate an ``X-Delete-At`` metadata item. If both + ``X-Delete-After`` and ``X-Delete-At`` are set then ``X-Delete-After`` + takes precedence. + in: header + required: false + type: integer +X-Delete-At: + description: | + The date and time in `UNIX Epoch time stamp format + `_ when the system removes the + object. For example, ``1440619048`` is equivalent to ``Mon, Wed, 26 Aug + 2015 19:57:28 GMT``. The value should be a positive integer corresponding + to a time in the future. If both ``X-Delete-After`` and ``X-Delete-At`` are + set then ``X-Delete-After`` takes precedence. + in: header + required: false + type: integer +X-Delete-At_resp: + description: | + If present, specifies date and time in `UNIX Epoch time stamp format + `_ when the system removes the + object. For example, ``1440619048`` is equivalent to ``Mon, Wed, 26 Aug + 2015 19:57:28 GMT``. 
+ in: header + required: false + type: integer +X-Detect-Content-Type: + description: | + If set to ``true``, Object Storage guesses the + content type based on the file extension and ignores the value + sent in the ``Content-Type`` header, if present. + in: header + required: false + type: boolean +X-Fresh-Metadata: + description: | + Enables object creation that omits existing user + metadata. If set to ``true``, the COPY request creates an object + without existing user metadata. Default value is ``false``. + in: header + required: false + type: boolean +X-History-Location: + description: | + The URL-encoded UTF-8 representation of the container that stores + previous versions of objects. If neither this nor ``X-Versions-Location`` + is set, versioning is disabled for this container. ``X-History-Location`` + and ``X-Versions-Location`` cannot both be set at the same time. For more + information about object versioning, see `Object versioning + `_. + in: header + required: false + type: string +X-History-Location_resp: + description: | + If present, this container has versioning enabled and the value + is the UTF-8 encoded name of another container. For more information + about object versioning, see `Object versioning + `_. + in: header + required: false + type: string +X-Newest: + description: | + If set to true , Object Storage queries all + replicas to return the most recent one. If you omit this header, + Object Storage responds faster after it finds one valid replica. + Because setting this header to true is more expensive for the back + end, use it only when it is absolutely needed. + in: header + required: false + type: boolean +X-Object-Manifest: + description: | + Set to specify that this is a dynamic large + object manifest object. The value is the container and object name + prefix of the segment objects in the form ``container/prefix``. + You must UTF-8-encode and then URL-encode the names of the + container and prefix before you include them in this header. + in: header + required: false + type: string +X-Object-Manifest_resp: + description: | + If present, this is a dynamic large object + manifest object. The value is the container and object name prefix + of the segment objects in the form ``container/prefix``. + in: header + required: false + type: string +X-Object-Meta-name: + description: | + The object metadata, where ``name`` is the name + of the metadata item. You must specify an + ``X-Object-Meta-name`` header for each metadata ``name`` item that + you want to add or update. + in: header + required: false + type: string +X-Object-Meta-name_resp: + description: | + If present, the custom object metadata item, where ``name`` + is the name of the metadata item. One``X-Object-Meta-name`` + response header appears for each metadata ``name`` item. + in: header + required: false + type: string +X-Openstack-Request-Id: + description: | + A unique transaction ID for this request. Your + service provider might need this value if you report a problem. + (same as ``X-Trans-Id``) + in: header + required: true + type: string +X-Remove-Account-name: + description: | + Removes the metadata item named ``name``. + For example, ``X-Remove-Account-Meta-Blue`` removes + custom metadata. + in: header + required: false + type: string +X-Remove-Container-name: + description: | + Removes the metadata item named ``name``. For + example, ``X-Remove-Container-Read`` removes the + ``X-Container-Read`` metadata item and ``X-Remove-Container-Meta-Blue`` + removes custom metadata. 
+ in: header + required: false + type: string +X-Remove-History-Location: + description: | + Set to any value to disable versioning. Note that this disables version + that was set via ``X-Versions-Location`` as well. + in: header + required: false + type: string +X-Remove-Versions-Location: + description: | + Set to any value to disable versioning. Note that this disables version + that was set via ``X-History-Location`` as well. + in: header + required: false + type: string +X-Service-Token: + description: | + A service token. See `OpenStack Service Using Composite Tokens + `_ for more information. + in: header + required: false + type: string +X-Static-Large-Object: + description: | + Set to ``true`` if this object is a static large + object manifest object. + in: header + required: true + type: boolean +X-Storage-Policy: + description: | + In requests, specifies the name of the storage policy to use for + the container. In responses, is the storage policy name. + The storage policy of the container cannot be changed. + in: header + required: false + type: string +X-Symlink-Target: + description: | + Set to specify that this is a symlink object. + The value is the relative path of the target object in the + format /. The target object does not need to + exist at the time of symlink creation. + You must UTF-8-encode and then URL-encode the names of the + container and object before you include them in this header. + in: header + required: false + type: string +X-Symlink-Target-Account: + description: | + Set to specify that this is a cross-account symlink to + an object in the account specified in the value. + The ``X-Symlink-Target`` must also be set for this to + be effective. + You must UTF-8-encode and then URL-encode the account name + before you include it in this header. + in: header + required: false + type: string +X-Symlink-Target-Account_resp: + description: | + If present, and ``X-Symlink-Target`` is present, then + this is a cross-account symlink to + an object in the account specified in the value. + in: header + required: false + type: string +X-Symlink-Target_resp: + description: | + If present, this is a symlink object. + The value is the relative path of the target object in the + format /. + in: header + required: false + type: string +X-Timestamp: + description: | + The date and time in `UNIX Epoch time stamp + format `_ when the + account, container, or object was initially created as a current + version. For example, ``1440619048`` is equivalent to ``Mon, Wed, + 26 Aug 2015 19:57:28 GMT``. + in: header + required: true + type: integer +X-Trans-Id: + description: | + A unique transaction ID for this request. Your + service provider might need this value if you report a problem. + in: header + required: true + type: string +X-Trans-Id-Extra: + description: | + Extra transaction information. Use the ``X-Trans-Id-Extra`` + request header to include extra information to help you + debug any errors that might occur with large object upload and + other Object Storage transactions. The server appends the + first 32 characters of the ``X-Trans-Id-Extra`` request header + value to the transaction ID value in the generated ``X-Trans-Id`` + response header. You must UTF-8-encode and then URL-encode the + extra transaction information before you include it in the + ``X-Trans-Id-Extra`` request header. For example, you can include + extra transaction information when you upload `large objects + `_ + such as images. 
When + you upload each segment and the manifest, include the same value + in the ``X-Trans-Id-Extra`` request header. If an error occurs, + you can find all requests that are related to the large object + upload in the Object Storage logs. You can also use ``X-Trans-Id-Extra`` + strings to help operators debug requests that fail to + receive responses. The operator can search for the extra + information in the logs. + in: header + required: false + type: string +X-Versions-Location: + description: | + The URL-encoded UTF-8 representation of the container that stores + previous versions of objects. If neither this nor ``X-History-Location`` + is set, versioning is disabled for this container. ``X-Versions-Location`` + and ``X-History-Location`` cannot both be set at the same time. For more + information about object versioning, see `Object versioning + `_. + in: header + required: false + type: string +X-Versions-Location_resp: + description: | + If present, this container has versioning enabled and the value + is the UTF-8 encoded name of another container. For more information + about object versioning, see `Object versioning + `_. + in: header + required: false + type: string + +# variables in path +account: + description: | + The unique name for the account. An account is + also known as the project or tenant. + in: path + required: false + type: string +container: + description: | + The unique (within an account) name for the container. The container + name must be from 1 to 256 characters long and can start with any + character and contain any pattern. Character set must be UTF-8. + The container name cannot contain a slash (``/``) character + because this character delimits the container and object name. For + example, the path ``/v1/account/www/pages`` specifies the ``www`` + container, not the ``www/pages`` container. + in: path + required: false + type: string +object: + description: | + The unique name for the object. + in: path + required: false + type: string + +# variables in query +bulk-delete: + description: | + When the ``bulk-delete`` query parameter is present in the POST + request, multiple objects or containers can be deleted + with a single request. See `Bulk Delete + `_ + for how this feature is used. + in: query + required: false + type: string +delimiter: + description: | + The delimiter is a single character used to split object + names to present a pseudo-directory hierarchy of objects. When combined + with a ``prefix`` query, this enables API users to simulate and + traverse the objects in a container as if they were in a directory tree. + in: query + required: false + type: string +end_marker: + description: | + For a string value, `x` , constrains the list to items whose names + are less than `x`. + in: query + required: false + type: string +extract-archive: + description: | + When the ``extract-archive`` query parameter is present in the POST + request, an archive (tar file) is uploaded and extracted to + create multiple objects. See `Extract Archive + `_ + for how this feature is used. + in: query + required: false + type: string +filename: + description: | + Overrides the default file name. Object Storage + generates a default file name for GET temporary URLs that is based + on the object name. Object Storage returns this value in the + ``Content-Disposition`` response header. Browsers can interpret + this file name value as a file attachment to save. For more + information about temporary URLs, see `Temporary URL middleware + `_. 
+ in: query + required: false + type: string +format: + description: | + The response format. Valid values are ``json``, + ``xml``, or ``plain``. The default is ``plain``. If you append + the ``format=xml`` or ``format=json`` query parameter to the + storage account URL, the response shows extended container + information serialized in that format. If you append the + ``format=plain`` query parameter, the response lists the container + names separated by newlines. + in: query + required: false + type: string +limit: + description: | + For an integer value n , limits the number of + results to n . + in: query + required: false + type: integer +marker: + description: | + For a string value, `x` , constrains the list to items whose names + are greater than `x`. + in: query + required: false + type: string +multipart-manifest_copy: + description: | + If you include the ``multipart-manifest=get`` + query parameter and the object is a large object, the object + contents are not copied. Instead, the manifest is copied to + the new object. + in: query + required: false + type: string +multipart-manifest_delete: + description: | + If you include the ``multipart-manifest=delete`` + query parameter and the object is a static large object, the + segment objects and manifest object are deleted. If you omit the + ``multipart-manifest=delete`` query parameter and the object is a + static large object, the manifest object is deleted but the + segment objects are not deleted. The response body will contain + the status of the deletion of every processed segment object. + in: query + required: false + type: string +multipart-manifest_get: + description: | + If you include the ``multipart-manifest=get`` + query parameter and the object is a large object, the object + contents are not returned. Instead, the manifest is returned in + the ``X-Object-Manifest`` response header for dynamic large + objects or in the response body for static large objects. + in: query + required: false + type: string +multipart-manifest_head: + description: | + If you include the ``multipart-manifest=get`` query parameter and the + object is a large object, the object metadata is not returned. Instead, the + response headers will include the manifest metadata and for dynamic large + objects the ``X-Object-Manifest`` response header. + in: query + required: false + type: string +multipart-manifest_put: + description: | + If you include the ``multipart-manifest=put`` query parameter, the object + is a static large object manifest and the body contains the manifest. + See `Static large objects `_ for more information. + in: query + required: false + type: string +path: + description: | + For a string value, returns the object names that + are nested in the pseudo path. Please use ``prefix``/``delimiter`` + queries instead of using this ``path`` query. + in: query + required: false + type: string +prefix: + description: | + Only objects with this prefix will be returned. When combined with a + ``delimiter`` query, this enables API users to simulate and + traverse the objects in a container as if they were in a directory tree. + in: query + required: false + type: string +reverse: + description: | + By default, listings are returned sorted by name, ascending. If you include + the ``reverse=true`` query parameter, the listing will be returned sorted + by name, descending. + in: query + required: false + type: boolean +swiftinfo_expires: + description: | + The time at which ``swiftinfo_sig`` expires. 
The time is in + `UNIX Epoch time stamp format + `_. + in: query + required: false + type: integer +swiftinfo_sig: + description: | + A hash-based message authentication code (HMAC) + that enables access to administrator-only information. To use this + parameter, the ``swiftinfo_expires`` parameter is also required. + in: query + required: false + type: string +symlink: + description: | + If you include the ``symlink=get`` query parameter + and the object is a symlink, then the response will include + data and metadata from the symlink itself rather than from the target. + in: query + required: false + type: string +symlink_copy: + description: | + If you include the ``symlink=get`` query parameter + and the object is a symlink, the target object + contents are not copied. Instead, the symlink is copied to + create a new symlink to the same target. + in: query + required: false + type: string +temp_url_expires: + description: | + The date and time in `UNIX Epoch time stamp + format `_ or + `ISO 8601 UTC timestamp `_ + when the signature for temporary URLs expires. + For example, ``1440619048`` or ``2015-08-26T19:57:28Z`` + is equivalent to ``Mon, Wed, 26 Aug 2015 19:57:28 GMT``. For more + information about temporary URLs, see `Temporary URL middleware + `_. + in: query + required: true + type: integer +temp_url_sig: + description: | + Used with temporary URLs to sign the request with + an HMAC-SHA1 cryptographic signature that defines the allowed HTTP + method, expiration date, full path to the object, and the secret + key for the temporary URL. For more information about temporary + URLs, see `Temporary URL middleware + `_. + in: query + required: true + type: string + +# variables in body +bytes_in_account_get: + description: | + The total number of bytes that are stored in + Object Storage for the account. + in: body + required: true + type: integer +bytes_in_container_get: + description: | + The total number of bytes that are stored in + Object Storage for the container. + in: body + required: true + type: integer +content_type: + description: | + The content type of the object. + in: body + required: true + type: string +count: + description: | + The number of objects in the container. + in: body + required: true + type: integer +hash: + description: | + The MD5 checksum value of the object content. + in: body + required: true + type: string +last_modified: + description: | + The date and time when the object was last modified. + + The date and time stamp format is `ISO 8601 + `_: + + :: + + CCYY-MM-DDThh:mm:ss±hh:mm + + For example, ``2015-08-27T09:49:58-05:00``. + + The ``±hh:mm`` value, if included, is the time zone as an offset + from UTC. In the previous example, the offset value is ``-05:00``. + in: body + required: true + type: string +name_in_account_get: + description: | + The name of the container. + in: body + required: true + type: string +name_in_container_get: + description: | + The name of the object. + in: body + required: true + type: string +symlink_path: + description: | + This field exists only when the object is symlink. + This is the target path of the symlink object. 
+ in: body + required: true + type: string + + diff --git a/api-ref/source/samples/account-containers-list-http-request-json.txt b/api-ref/source/samples/account-containers-list-http-request-json.txt new file mode 100644 index 0000000000..137ee93fbd --- /dev/null +++ b/api-ref/source/samples/account-containers-list-http-request-json.txt @@ -0,0 +1 @@ +curl -i $publicURL?format=json -X GET -H "X-Auth-Token: $token" diff --git a/api-ref/source/samples/account-containers-list-http-request-xml.txt b/api-ref/source/samples/account-containers-list-http-request-xml.txt new file mode 100644 index 0000000000..6f9293fdca --- /dev/null +++ b/api-ref/source/samples/account-containers-list-http-request-xml.txt @@ -0,0 +1 @@ +curl -i $publicURL?format=xml -X GET -H "X-Auth-Token: $token" diff --git a/api-ref/source/samples/account-containers-list-http-response-json.txt b/api-ref/source/samples/account-containers-list-http-response-json.txt new file mode 100644 index 0000000000..6c86e00ca5 --- /dev/null +++ b/api-ref/source/samples/account-containers-list-http-response-json.txt @@ -0,0 +1,12 @@ +HTTP/1.1 200 OK +Content-Length: 96 +X-Account-Object-Count: 1 +X-Timestamp: 1389453423.35964 +X-Account-Meta-Subject: Literature +X-Account-Bytes-Used: 14 +X-Account-Container-Count: 2 +Content-Type: application/json; charset=utf-8 +Accept-Ranges: bytes +X-Trans-Id: tx274a77a8975c4a66aeb24-0052d95365 +X-Openstack-Request-Id: tx274a77a8975c4a66aeb24-0052d95365 +Date: Fri, 17 Jan 2014 15:59:33 GMT diff --git a/api-ref/source/samples/account-containers-list-http-response-xml.txt b/api-ref/source/samples/account-containers-list-http-response-xml.txt new file mode 100644 index 0000000000..c477638567 --- /dev/null +++ b/api-ref/source/samples/account-containers-list-http-response-xml.txt @@ -0,0 +1,12 @@ +HTTP/1.1 200 OK +Content-Length: 262 +X-Account-Object-Count: 1 +X-Timestamp: 1389453423.35964 +X-Account-Meta-Subject: Literature +X-Account-Bytes-Used: 14 +X-Account-Container-Count: 2 +Content-Type: application/xml; charset=utf-8 +Accept-Ranges: bytes +X-Trans-Id: tx69f60bc9f7634a01988e6-0052d9544b +X-Openstack-Request-Id: tx69f60bc9f7634a01988e6-0052d9544b +Date: Fri, 17 Jan 2014 16:03:23 GMT diff --git a/api-ref/source/samples/account-containers-list-response.json b/api-ref/source/samples/account-containers-list-response.json new file mode 100644 index 0000000000..d9864aa246 --- /dev/null +++ b/api-ref/source/samples/account-containers-list-response.json @@ -0,0 +1,14 @@ +[ + { + "count": 0, + "bytes": 0, + "name": "janeausten", + "last_modified": "2013-11-19T20:08:13.283452" + }, + { + "count": 1, + "bytes": 14, + "name": "marktwain", + "last_modified": "2016-04-29T16:23:50.460230" + } +] diff --git a/api-ref/source/samples/account-containers-list-response.xml b/api-ref/source/samples/account-containers-list-response.xml new file mode 100644 index 0000000000..6e194aebce --- /dev/null +++ b/api-ref/source/samples/account-containers-list-response.xml @@ -0,0 +1,15 @@ + + + + janeausten + 0 + 0 + 2013-11-19T20:08:13.283452 + + + marktwain + 1 + 14 + 2016-04-29T16:23:50.460230 + + diff --git a/api-ref/source/samples/capabilities-list-response.json b/api-ref/source/samples/capabilities-list-response.json new file mode 100644 index 0000000000..f082dc7b9e --- /dev/null +++ b/api-ref/source/samples/capabilities-list-response.json @@ -0,0 +1,12 @@ +{ + "swift": { + "version": "1.11.0" + }, + "slo": { + "max_manifest_segments": 1000, + "max_manifest_size": 2097152, + "min_segment_size": 1 + }, + "staticweb": {}, + 
"tempurl": {} +} diff --git a/api-ref/source/samples/containers-list-http-request.txt b/api-ref/source/samples/containers-list-http-request.txt new file mode 100644 index 0000000000..4101ce80e5 --- /dev/null +++ b/api-ref/source/samples/containers-list-http-request.txt @@ -0,0 +1,3 @@ +GET /{api_version}/{account} HTTP/1.1 +Host: storage.swiftdrive.com +X-Auth-Token: eaaafd18-0fed-4b3a-81b4-663c99ec1cbb \ No newline at end of file diff --git a/api-ref/source/samples/containers-list-http-response.txt b/api-ref/source/samples/containers-list-http-response.txt new file mode 100644 index 0000000000..43070e5235 --- /dev/null +++ b/api-ref/source/samples/containers-list-http-response.txt @@ -0,0 +1,9 @@ +HTTP/1.1 200 Ok +Date: Thu, 07 Jun 2010 18:57:07 GMT +Content-Type: text/plain; charset=UTF-8 +Content-Length: 32 + +images +movies +documents +backups \ No newline at end of file diff --git a/api-ref/source/samples/endpoints-list-response-headers.json b/api-ref/source/samples/endpoints-list-response-headers.json new file mode 100644 index 0000000000..3a0d930603 --- /dev/null +++ b/api-ref/source/samples/endpoints-list-response-headers.json @@ -0,0 +1,14 @@ +{ + "endpoints": [ + "http://storage01.swiftdrive.com:6208/d8/583/AUTH_dev/EC_cont1/obj", + "http://storage02.swiftdrive.com:6208/d2/583/AUTH_dev/EC_cont1/obj", + "http://storage02.swiftdrive.com:6206/d3/583/AUTH_dev/EC_cont1/obj", + "http://storage02.swiftdrive.com:6208/d5/583/AUTH_dev/EC_cont1/obj", + "http://storage01.swiftdrive.com:6207/d7/583/AUTH_dev/EC_cont1/obj", + "http://storage02.swiftdrive.com:6207/d4/583/AUTH_dev/EC_cont1/obj", + "http://storage01.swiftdrive.com:6206/d6/583/AUTH_dev/EC_cont1/obj" + ], + "headers": { + "X-Backend-Storage-Policy-Index": "2" + } +} diff --git a/api-ref/source/samples/endpoints-list-response.json b/api-ref/source/samples/endpoints-list-response.json new file mode 100644 index 0000000000..1f0f9cf93f --- /dev/null +++ b/api-ref/source/samples/endpoints-list-response.json @@ -0,0 +1,8 @@ +{ + "endpoints": [ + "http://storage02.swiftdrive:6202/d2/617/AUTH_dev", + "http://storage01.swiftdrive:6202/d8/617/AUTH_dev", + "http://storage01.swiftdrive:6202/d11/617/AUTH_dev" + ], + "headers": {} +} diff --git a/api-ref/source/samples/goodbyeworld.txt b/api-ref/source/samples/goodbyeworld.txt new file mode 100644 index 0000000000..aebc9c0c05 --- /dev/null +++ b/api-ref/source/samples/goodbyeworld.txt @@ -0,0 +1 @@ +Goodbye World! \ No newline at end of file diff --git a/api-ref/source/samples/helloworld.txt b/api-ref/source/samples/helloworld.txt new file mode 100644 index 0000000000..6900abf34d --- /dev/null +++ b/api-ref/source/samples/helloworld.txt @@ -0,0 +1 @@ +Hello World Again! 
\ No newline at end of file diff --git a/api-ref/source/samples/objects-list-http-response-json.txt b/api-ref/source/samples/objects-list-http-response-json.txt new file mode 100644 index 0000000000..aa0f6b4297 --- /dev/null +++ b/api-ref/source/samples/objects-list-http-response-json.txt @@ -0,0 +1,11 @@ +HTTP/1.1 200 OK +Content-Length: 341 +X-Container-Object-Count: 2 +Accept-Ranges: bytes +X-Container-Meta-Book: TomSawyer +X-Timestamp: 1389727543.65372 +X-Container-Bytes-Used: 26 +Content-Type: application/json; charset=utf-8 +X-Trans-Id: tx26377fe5fab74869825d1-0052d6bdff +X-Openstack-Request-Id: tx26377fe5fab74869825d1-0052d6bdff +Date: Wed, 15 Jan 2014 16:57:35 GMT diff --git a/api-ref/source/samples/objects-list-http-response-xml.txt b/api-ref/source/samples/objects-list-http-response-xml.txt new file mode 100644 index 0000000000..b9804cb583 --- /dev/null +++ b/api-ref/source/samples/objects-list-http-response-xml.txt @@ -0,0 +1,11 @@ +HTTP/1.1 200 OK +Content-Length: 500 +X-Container-Object-Count: 2 +Accept-Ranges: bytes +X-Container-Meta-Book: TomSawyer +X-Timestamp: 1389727543.65372 +X-Container-Bytes-Used: 26 +Content-Type: application/xml; charset=utf-8 +X-Trans-Id: txc75ea9a6e66f47d79e0c5-0052d6be76 +X-Openstack-Request-Id: txc75ea9a6e66f47d79e0c5-0052d6be76 +Date: Wed, 15 Jan 2014 16:59:35 GMT diff --git a/api-ref/source/samples/objects-list-response.json b/api-ref/source/samples/objects-list-response.json new file mode 100644 index 0000000000..b104d3a9a6 --- /dev/null +++ b/api-ref/source/samples/objects-list-response.json @@ -0,0 +1,16 @@ +[ + { + "hash": "451e372e48e0f6b1114fa0724aa79fa1", + "last_modified": "2014-01-15T16:41:49.390270", + "bytes": 14, + "name": "goodbye", + "content_type": "application/octet-stream" + }, + { + "hash": "ed076287532e86365e841e92bfc50d8c", + "last_modified": "2014-01-15T16:37:43.427570", + "bytes": 12, + "name": "helloworld", + "content_type": "application/octet-stream" + } +] diff --git a/api-ref/source/samples/objects-list-response.xml b/api-ref/source/samples/objects-list-response.xml new file mode 100644 index 0000000000..07fda614c1 --- /dev/null +++ b/api-ref/source/samples/objects-list-response.xml @@ -0,0 +1,17 @@ + + + + goodbye + 451e372e48e0f6b1114fa0724aa79fa1 + 14 + application/octet-stream + 2014-01-15T16:41:49.390270 + + + helloworld + ed076287532e86365e841e92bfc50d8c + 12 + application/octet-stream + 2014-01-15T16:37:43.427570 + + diff --git a/api-ref/source/storage-account-services.inc b/api-ref/source/storage-account-services.inc new file mode 100644 index 0000000000..2bcab9ab94 --- /dev/null +++ b/api-ref/source/storage-account-services.inc @@ -0,0 +1,430 @@ +.. -*- rst -*- + +======== +Accounts +======== + +Lists containers for an account. Creates, updates, shows, and +deletes account metadata. For more information and concepts about +accounts see `Object Storage API overview +`_. + + + +Show account details and list containers +======================================== + +.. rest_method:: GET /v1/{account} + +Shows details for an account and lists containers, sorted by name, in the account. + +The sort order for the name is based on a binary comparison, a +single built-in collating sequence that compares string data by +using the SQLite memcmp() function, regardless of text encoding. +See `Collating Sequences +`_. + +The response body returns a list of containers. The default +response (``text/plain``) returns one container per line. 
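As an illustration only (it is not part of the patched API reference files), the following minimal sketch shows how a client might fetch the listing in JSON and page through it with the ``marker`` and ``limit`` query parameters, applying the end-of-list rule described in the next paragraph. It assumes the Python ``requests`` library; ``STORAGE_URL`` and ``TOKEN`` are hypothetical placeholders for the account's storage URL and a valid auth token, not values defined by the API.

::

    import requests

    STORAGE_URL = "http://127.0.0.1:8080/v1/AUTH_test"  # hypothetical account storage URL
    TOKEN = "AUTH_tk_example"                           # hypothetical auth token

    def list_containers(limit=100):
        """Yield every container dict in the account, paging with marker/limit."""
        marker = None
        while True:
            params = {"format": "json", "limit": limit}
            if marker is not None:
                params["marker"] = marker
            resp = requests.get(STORAGE_URL, params=params,
                                headers={"X-Auth-Token": TOKEN})
            resp.raise_for_status()
            containers = resp.json()  # list of {"name", "count", "bytes", "last_modified"}
            for container in containers:
                yield container
            if len(containers) < limit:       # fewer items than ``limit``: end of the list
                return
            marker = containers[-1]["name"]   # continue after the last name returned

    for container in list_containers():
        print(container["name"], container["bytes"])

With ``format=json`` an empty account returns ``200`` with ``[]``, so the same loop also covers the no-containers case described below.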
+ +If you use query parameters to page through a long list of +containers, you have reached the end of the list if the number of +items in the returned list is less than the request ``limit`` +value. The list contains more items if the number of items in the +returned list equals the ``limit`` value. + +When asking for a list of containers and there are none, the +response behavior changes depending on whether the request format +is text, JSON, or XML. For a text response, you get a 204 , because +there is no content. However, for a JSON or XML response, you get a +200 with content indicating an empty array. + +Example requests and responses: + +- Show account details and list containers and ask for a JSON + response: + + .. literalinclude:: samples/account-containers-list-http-request-json.txt + .. literalinclude:: samples/account-containers-list-http-response-json.txt + .. literalinclude:: samples/account-containers-list-response.json + +- Show account details and list containers and ask for an XML response: + + .. literalinclude:: samples/account-containers-list-http-request-xml.txt + .. literalinclude:: samples/account-containers-list-http-response-xml.txt + .. literalinclude:: samples/account-containers-list-response.xml + +If the request succeeds, the operation returns one of these status +codes: + +- ``OK (200)``. Success. The response body lists the containers. + +- ``No Content (204)``. Success. The response body shows no + containers. Either the account has no containers or you are + paging through a long list of names by using the ``marker``, + ``limit``, or ``end_marker`` query parameter and you have reached + the end of the list. + + +Normal response codes: 200 +Error response codes:204, + + +Request +------- + +.. rest_parameters:: parameters.yaml + + - account: account + - limit: limit + - marker: marker + - end_marker: end_marker + - format: format + - prefix: prefix + - delimiter: delimiter + - reverse: reverse + - X-Auth-Token: X-Auth-Token + - X-Service-Token: X-Service-Token + - X-Newest: X-Newest + - Accept: Accept + - X-Trans-Id-Extra: X-Trans-Id-Extra + + +Response Parameters +------------------- + +.. rest_parameters:: parameters.yaml + + - Content-Length: Content-Length_listing_resp + - X-Account-Meta-name: X-Account-Meta-name + - X-Account-Meta-Temp-URL-Key: X-Account-Meta-Temp-URL-Key_resp + - X-Account-Meta-Temp-URL-Key-2: X-Account-Meta-Temp-URL-Key-2_resp + - X-Timestamp: X-Timestamp + - X-Trans-Id: X-Trans-Id + - X-Openstack-Request-Id: X-Openstack-Request-Id + - Date: Date + - X-Account-Bytes-Used: X-Account-Bytes-Used + - X-Account-Container-Count: X-Account-Container-Count + - X-Account-Object-Count: X-Account-Object-Count + - X-Account-Storage-Policy-name-Bytes-Used: X-Account-Storage-Policy-name-Bytes-Used + - X-Account-Storage-Policy-name-Container-Count: X-Account-Storage-Policy-name-Container-Count + - X-Account-Storage-Policy-name-Object-Count: X-Account-Storage-Policy-name-Object-Count + - X-Account-Meta-Quota-Bytes: X-Account-Meta-Quota-Bytes_resp + - X-Account-Access-Control: X-Account-Access-Control_resp + - Content-Type: Content-Type_listing_resp + - count: count + - bytes: bytes_in_account_get + - name: name_in_account_get + + +Create, update, or delete account metadata +========================================== + +.. rest_method:: POST /v1/{account} + +Creates, updates, or deletes account metadata. 
+ +To create, update, or delete custom metadata, use the +``X-Account-Meta-{name}`` request header, where ``{name}`` is the name of the +metadata item. + +Account metadata operations work differently than how +object metadata operations work. Depending on the contents of your +POST account metadata request, the Object Storage API updates the +metadata as shown in the following table: + +**Account metadata operations** + ++----------------------------------------------------------+---------------------------------------------------------------+ +| POST request header contains | Result | ++----------------------------------------------------------+---------------------------------------------------------------+ +| A metadata key without a value. | The API removes the metadata item from the account. | +| | | +| The metadata key already exists for the account. | | ++----------------------------------------------------------+---------------------------------------------------------------+ +| A metadata key without a value. | The API ignores the metadata key. | +| | | +| The metadata key does not already exist for the account. | | ++----------------------------------------------------------+---------------------------------------------------------------+ +| A metadata key value. | The API updates the metadata key value for the account. | +| | | +| The metadata key already exists for the account. | | ++----------------------------------------------------------+---------------------------------------------------------------+ +| A metadata key value. | The API adds the metadata key and value pair, or item, to the | +| | account. | +| The metadata key does not already exist for the account. | | ++----------------------------------------------------------+---------------------------------------------------------------+ +| One or more account metadata items are omitted. | The API does not change the existing metadata items. | +| | | +| The metadata items already exist for the account. | | ++----------------------------------------------------------+---------------------------------------------------------------+ + + + +To delete a metadata header, send an empty value for that header, +such as for the ``X-Account-Meta-Book`` header. If the tool you use +to communicate with Object Storage, such as an older version of +cURL, does not support empty headers, send the ``X-Remove-Account- +Meta-{name}`` header with an arbitrary value. For example, +``X-Remove-Account-Meta-Book: x``. The operation ignores the arbitrary +value. + +.. include:: metadata_header_syntax.inc +.. include:: metadata_header_encoding.inc + +Subsequent requests for the same key and value pair overwrite the +existing value. + +If the container already has other custom metadata items, a request +to create, update, or delete metadata does not affect those items. + +This operation does not accept a request body. 
+ +Example requests and responses: + +- Create account metadata: + + :: + + curl -i $publicURL -X POST -H "X-Auth-Token: $token" -H "X-Account-Meta-Book: MobyDick" -H "X-Account-Meta-Subject: Literature" + + + + + :: + + HTTP/1.1 204 No Content + Content-Length: 0 + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: tx8c2dd6aee35442a4a5646-0052d954fb + X-Openstack-Request-Id: tx8c2dd6aee35442a4a5646-0052d954fb + Date: Fri, 17 Jan 2014 16:06:19 GMT + + +- Update account metadata: + + :: + + curl -i $publicURL -X POST -H "X-Auth-Token: $token" -H "X-Account-Meta-Subject: AmericanLiterature" + + + + + :: + + HTTP/1.1 204 No Content + Content-Length: 0 + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: tx1439b96137364ab581156-0052d95532 + X-Openstack-Request-Id: tx1439b96137364ab581156-0052d95532 + Date: Fri, 17 Jan 2014 16:07:14 GMT + + +- Delete account metadata: + + :: + + curl -i $publicURL -X POST -H "X-Auth-Token: $token" -H "X-Remove-Account-Meta-Subject: x" + + + + + :: + + HTTP/1.1 204 No Content + Content-Length: 0 + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: tx411cf57701424da99948a-0052d9556f + X-Openstack-Request-Id: tx411cf57701424da99948a-0052d9556f + Date: Fri, 17 Jan 2014 16:08:15 GMT + + +If the request succeeds, the operation returns the ``No Content +(204)`` response code. + +To confirm your changes, issue a show account metadata request. + +Error response codes:204, + + +Request +------- + +.. rest_parameters:: parameters.yaml + + - account: account + - X-Auth-Token: X-Auth-Token + - X-Service-Token: X-Service-Token + - X-Account-Meta-Temp-URL-Key: X-Account-Meta-Temp-URL-Key_req + - X-Account-Meta-Temp-URL-Key-2: X-Account-Meta-Temp-URL-Key-2_req + - X-Account-Meta-name: X-Account-Meta-name_req + - X-Remove-Account-name: X-Remove-Account-name + - X-Account-Access-Control: X-Account-Access-Control_req + - X-Trans-Id-Extra: X-Trans-Id-Extra + + +Response Parameters +------------------- + +.. rest_parameters:: parameters.yaml + + - Date: Date + - X-Timestamp: X-Timestamp + - Content-Length: Content-Length_cud_resp + - Content-Type: Content-Type_cud_resp + - X-Trans-Id: X-Trans-Id + - X-Openstack-Request-Id: X-Openstack-Request-Id + + +Show account metadata +===================== + +.. rest_method:: HEAD /v1/{account} + +Shows metadata for an account. + +Metadata for the account includes: + +- Number of containers + +- Number of objects + +- Total number of bytes that are stored in Object Storage for the + account + +Because the storage system can store large amounts of data, take +care when you represent the total bytes response as an integer; +when possible, convert it to a 64-bit unsigned integer if your +platform supports that primitive type. + +Do not include metadata headers in this request. + +Show account metadata request: + +:: + + curl -i $publicURL -X HEAD -H "X-Auth-Token: $token" + + + + +:: + + HTTP/1.1 204 No Content + Content-Length: 0 + X-Account-Object-Count: 1 + X-Account-Meta-Book: MobyDick + X-Timestamp: 1389453423.35964 + X-Account-Bytes-Used: 14 + X-Account-Container-Count: 2 + Content-Type: text/plain; charset=utf-8 + Accept-Ranges: bytes + X-Trans-Id: txafb3504870144b8ca40f7-0052d955d4 + X-Openstack-Request-Id: txafb3504870144b8ca40f7-0052d955d4 + Date: Fri, 17 Jan 2014 16:09:56 GMT + + +If the account or authentication token is not valid, the operation +returns the ``Unauthorized (401)`` response code. + +Error response codes:204,401, + + +Request +------- + +.. 
rest_parameters:: parameters.yaml
+
+   - account: account
+   - X-Auth-Token: X-Auth-Token
+   - X-Service-Token: X-Service-Token
+   - X-Newest: X-Newest
+   - X-Trans-Id-Extra: X-Trans-Id-Extra
+
+
+Response Parameters
+-------------------
+
+.. rest_parameters:: parameters.yaml
+
+   - Content-Length: Content-Length_cud_resp
+   - X-Account-Meta-name: X-Account-Meta-name
+   - X-Account-Meta-Temp-URL-Key: X-Account-Meta-Temp-URL-Key_resp
+   - X-Account-Meta-Temp-URL-Key-2: X-Account-Meta-Temp-URL-Key-2_resp
+   - X-Timestamp: X-Timestamp
+   - X-Trans-Id: X-Trans-Id
+   - X-Openstack-Request-Id: X-Openstack-Request-Id
+   - Date: Date
+   - X-Account-Bytes-Used: X-Account-Bytes-Used
+   - X-Account-Object-Count: X-Account-Object-Count
+   - X-Account-Container-Count: X-Account-Container-Count
+   - X-Account-Storage-Policy-name-Bytes-Used: X-Account-Storage-Policy-name-Bytes-Used
+   - X-Account-Storage-Policy-name-Container-Count: X-Account-Storage-Policy-name-Container-Count
+   - X-Account-Storage-Policy-name-Object-Count: X-Account-Storage-Policy-name-Object-Count
+   - X-Account-Meta-Quota-Bytes: X-Account-Meta-Quota-Bytes_resp
+   - X-Account-Access-Control: X-Account-Access-Control_resp
+   - Content-Type: Content-Type_cud_resp
+
+
+Delete the specified account
+============================
+
+.. rest_method:: DELETE /v1/{account}
+
+Deletes the specified account when a reseller admin issues this request.
+An account is deleted only when (1) the request carries a reseller admin
+level auth token, (2) the DELETE is sent to a proxy server for the account
+to be deleted, and (3) that proxy server has the ``allow_account_management``
+config option set to true.
+
+Note that issuing a DELETE request simply marks the account for deletion
+later, as described in
+https://docs.openstack.org/swift/latest/overview_reaper.html.
+
+Take care when performing this operation because deleting an account is a
+one-way operation that is not trivially recoverable. In an OpenStack
+context, delete an account only after the corresponding project/tenant has
+been deleted from Keystone.
+
+
+::
+
+   curl -i $publicURL -X DELETE -H 'X-Auth-Token: $'
+
+
+
+::
+
+   HTTP/1.1 204 No Content
+   Content-Length: 0
+   Content-Type: text/html; charset=UTF-8
+   X-Account-Status: Deleted
+   X-Trans-Id: tx91ce60a640cc42eca198a-006128c180
+   X-Openstack-Request-Id: tx91ce60a640cc42eca198a-006128c180
+   Date: Fri, 27 Aug 2021 11:42:08 GMT
+
+If the account or authentication token is not valid, the operation
+returns the ``Unauthorized (401)`` response code. If you try to delete an
+account with a non-admin token, a ``403 Forbidden`` response code is
+returned. If you specify a non-existent account or an invalid URL, a
+``404 Not Found`` response code is returned.
+
+Normal response codes: 204
+
+Error response codes: 401, 403, 404
+
+
+Request
+-------
+
+.. rest_parameters:: parameters.yaml
+
+   - account: account
+   - X-Auth-Token: X-Auth-Token
+
+Response Parameters
+-------------------
+
+.. rest_parameters:: parameters.yaml
+
+   - Date: Date
+   - X-Timestamp: X-Timestamp
+   - Content-Length: Content-Length_cud_resp
+   - Content-Type: Content-Type_cud_resp
+   - X-Trans-Id: X-Trans-Id
+   - X-Openstack-Request-Id: X-Openstack-Request-Id
+
diff --git a/api-ref/source/storage-container-services.inc b/api-ref/source/storage-container-services.inc
new file mode 100644
index 0000000000..7d7be9fc52
--- /dev/null
+++ b/api-ref/source/storage-container-services.inc
@@ -0,0 +1,559 @@
+.. -*- rst -*-
+
+==========
+Containers
+==========
+
+Lists objects in a container.
Creates, shows details for, and +deletes containers. Creates, updates, shows, and deletes container +metadata. For more information and concepts about +containers see `Object Storage API overview +`_. + + +Show container details and list objects +======================================= + +.. rest_method:: GET /v1/{account}/{container} + +Shows details for a container and lists objects, sorted by name, in the container. + +Specify query parameters in the request to filter the list and +return a subset of objects. Omit query parameters to return +a list of objects that are stored in the container, +up to 10,000 names. The 10,000 maximum value is configurable. To +view the value for the cluster, issue a GET ``/info`` request. + +Example requests and responses: + +- ``OK (200)``. Success. The response body lists the objects. + +- ``No Content (204)``. Success. The response body shows no objects. + Either the container has no objects or you are paging through a + long list of objects by using the ``marker``, ``limit``, or + ``end_marker`` query parameter and you have reached the end of + the list. + +If the container does not exist, the call returns the ``Not Found +(404)`` response code. + +Normal response codes: 200, 204 + +Error response codes: 404 + + +Request +------- + +.. rest_parameters:: parameters.yaml + + - account: account + - container: container + - limit: limit + - marker: marker + - end_marker: end_marker + - prefix: prefix + - format: format + - delimiter: delimiter + - path: path + - reverse: reverse + - X-Auth-Token: X-Auth-Token + - X-Service-Token: X-Service-Token + - X-Newest: X-Newest + - Accept: Accept + - X-Container-Meta-Temp-URL-Key: X-Container-Meta-Temp-URL-Key_req + - X-Container-Meta-Temp-URL-Key-2: X-Container-Meta-Temp-URL-Key-2_req + - X-Trans-Id-Extra: X-Trans-Id-Extra + - X-Storage-Policy: X-Storage-Policy + + +Response Parameters +------------------- + +.. rest_parameters:: parameters.yaml + + - X-Container-Meta-name: X-Container-Meta-name + - Content-Length: Content-Length_listing_resp + - X-Container-Object-Count: X-Container-Object-Count + - X-Container-Bytes-Used: X-Container-Bytes-Used + - Accept-Ranges: Accept-Ranges + - X-Container-Meta-Temp-URL-Key: X-Container-Meta-Temp-URL-Key_resp + - X-Container-Meta-Temp-URL-Key-2: X-Container-Meta-Temp-URL-Key-2_resp + - X-Container-Meta-Quota-Count: X-Container-Meta-Quota-Count_resp + - X-Container-Meta-Quota-Bytes: X-Container-Meta-Quota-Bytes_resp + - X-Storage-Policy: X-Storage-Policy + - X-Container-Read: X-Container-Read_resp + - X-Container-Write: X-Container-Write_resp + - X-Container-Sync-Key: X-Container-Sync-Key_resp + - X-Container-Sync-To: X-Container-Sync-To_resp + - X-Versions-Location: X-Versions-Location_resp + - X-History-Location: X-History-Location_resp + - X-Timestamp: X-Timestamp + - X-Trans-Id: X-Trans-Id + - X-Openstack-Request-Id: X-Openstack-Request-Id + - Content-Type: Content-Type_listing_resp + - Date: Date + - hash: hash + - last_modified: last_modified + - content_type: content_type + - bytes: bytes_in_container_get + - name: name_in_container_get + - symlink_path: symlink_path + + +Response Example format=json +---------------------------- + +.. literalinclude:: samples/objects-list-http-response-json.txt +.. literalinclude:: samples/objects-list-response.json + + +Response Example format=xml +--------------------------- + +.. literalinclude:: samples/objects-list-http-response-xml.txt +.. 
literalinclude:: samples/objects-list-response.xml + +Create container +================ + +.. rest_method:: PUT /v1/{account}/{container} + +Creates a container. + +You do not need to check whether a container already exists before +issuing a PUT operation because the operation is idempotent: It +creates a container or updates an existing container, as +appropriate. + +To create, update, or delete a custom metadata item, use the ``X +-Container-Meta-{name}`` header, where ``{name}`` is the name of +the metadata item. + +.. include:: metadata_header_syntax.inc +.. include:: metadata_header_encoding.inc + +Example requests and responses: + +- Create a container with no metadata: + + :: + + curl -i $publicURL/steven -X PUT -H "Content-Length: 0" -H "X-Auth-Token: $token" + + + + + :: + + HTTP/1.1 201 Created + Content-Length: 0 + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: tx7f6b7fa09bc2443a94df0-0052d58b56 + X-Openstack-Request-Id: tx7f6b7fa09bc2443a94df0-0052d58b56 + Date: Tue, 14 Jan 2014 19:09:10 GMT + + +- Create a container with metadata: + + :: + + curl -i $publicURL/marktwain -X PUT -H "X-Auth-Token: $token" -H "X-Container-Meta-Book: TomSawyer" + + + + + :: + + HTTP/1.1 201 Created + Content-Length: 0 + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: tx06021f10fc8642b2901e7-0052d58f37 + X-Openstack-Request-Id: tx06021f10fc8642b2901e7-0052d58f37 + Date: Tue, 14 Jan 2014 19:25:43 GMT + +- Create a container with an ACL to allow anybody to get an object in the + marktwain container: + :: + + curl -i $publicURL/marktwain -X PUT -H "X-Auth-Token: $token" -H "X-Container-Read: .r:*" + + + + :: + + HTTP/1.1 201 Created + Content-Length: 0 + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: tx06021f10fc8642b2901e7-0052d58f37 + X-Openstack-Request-Id: tx06021f10fc8642b2901e7-0052d58f37 + Date: Tue, 14 Jan 2014 19:25:43 GMT + +Normal response codes: 201, 202 + +Error response codes: 400, 404, 507 + +Request +------- + +.. rest_parameters:: parameters.yaml + + - account: account + - container: container + - X-Auth-Token: X-Auth-Token + - X-Service-Token: X-Service-Token + - X-Container-Read: X-Container-Read + - X-Container-Write: X-Container-Write + - X-Container-Sync-To: X-Container-Sync-To + - X-Container-Sync-Key: X-Container-Sync-Key + - X-Versions-Location: X-Versions-Location + - X-History-Location: X-History-Location + - X-Container-Meta-name: X-Container-Meta-name_req + - X-Container-Meta-Access-Control-Allow-Origin: X-Container-Meta-Access-Control-Allow-Origin + - X-Container-Meta-Access-Control-Max-Age: X-Container-Meta-Access-Control-Max-Age + - X-Container-Meta-Access-Control-Expose-Headers: X-Container-Meta-Access-Control-Expose-Headers + - X-Container-Meta-Quota-Bytes: X-Container-Meta-Quota-Bytes + - X-Container-Meta-Quota-Count: X-Container-Meta-Quota-Count + - X-Container-Meta-Temp-URL-Key: X-Container-Meta-Temp-URL-Key_req + - X-Container-Meta-Temp-URL-Key-2: X-Container-Meta-Temp-URL-Key-2_req + - X-Trans-Id-Extra: X-Trans-Id-Extra + - X-Storage-Policy: X-Storage-Policy + + +Response Parameters +------------------- + +.. rest_parameters:: parameters.yaml + + - Date: Date + - X-Timestamp: X-Timestamp + - Content-Length: Content-Length_cud_resp + - Content-Type: Content-Type_cud_resp + - X-Trans-Id: X-Trans-Id + - X-Openstack-Request-Id: X-Openstack-Request-Id + + + + + + +Create, update, or delete container metadata +============================================ + +.. 
rest_method:: POST /v1/{account}/{container} + +Creates, updates, or deletes custom metadata for a container. + +To create, update, or delete a custom metadata item, use the ``X +-Container-Meta-{name}`` header, where ``{name}`` is the name of +the metadata item. + +.. include:: metadata_header_syntax.inc +.. include:: metadata_header_encoding.inc + +Subsequent requests for the same key and value pair overwrite the +previous value. + +To delete container metadata, send an empty value for that header, +such as for the ``X-Container-Meta-Book`` header. If the tool you +use to communicate with Object Storage, such as an older version of +cURL, does not support empty headers, send the ``X-Remove- +Container-Meta-{name}`` header with an arbitrary value. For +example, ``X-Remove-Container-Meta-Book: x``. The operation ignores +the arbitrary value. + +If the container already has other custom metadata items, a request +to create, update, or delete metadata does not affect those items. + +Example requests and responses: + +- Create container metadata: + + :: + + curl -i $publicURL/marktwain -X POST -H "X-Auth-Token: $token" -H "X-Container-Meta-Author: MarkTwain" -H "X-Container-Meta-Web-Directory-Type: text/directory" -H "X-Container-Meta-Century: Nineteenth" + + + + + :: + + HTTP/1.1 204 No Content + Content-Length: 0 + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: tx05dbd434c651429193139-0052d82635 + X-Openstack-Request-Id: tx05dbd434c651429193139-0052d82635 + Date: Thu, 16 Jan 2014 18:34:29 GMT + + +- Update container metadata: + + :: + + curl -i $publicURL/marktwain -X POST -H "X-Auth-Token: $token" -H "X-Container-Meta-Author: SamuelClemens" + + + + + :: + + HTTP/1.1 204 No Content + Content-Length: 0 + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: txe60c7314bf614bb39dfe4-0052d82653 + X-Openstack-Request-Id: txe60c7314bf614bb39dfe4-0052d82653 + Date: Thu, 16 Jan 2014 18:34:59 GMT + + +- Delete container metadata: + + :: + + curl -i $publicURL/marktwain -X POST -H "X-Auth-Token: $token" -H "X-Remove-Container-Meta-Century: x" + + + + + :: + + HTTP/1.1 204 No Content + Content-Length: 0 + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: tx7997e18da2a34a9e84ceb-0052d826d0 + X-Openstack-Request-Id: tx7997e18da2a34a9e84ceb-0052d826d0 + Date: Thu, 16 Jan 2014 18:37:04 GMT + + +If the request succeeds, the operation returns the ``No Content +(204)`` response code. + +To confirm your changes, issue a show container metadata request. + +Normal response codes: 204 + +Error response codes: 404 + + +Request +------- + +.. 
rest_parameters:: parameters.yaml + + - account: account + - container: container + - X-Auth-Token: X-Auth-Token + - X-Service-Token: X-Service-Token + - X-Container-Read: X-Container-Read + - X-Remove-Container-name: X-Remove-Container-name + - X-Container-Write: X-Container-Write + - X-Container-Sync-To: X-Container-Sync-To + - X-Container-Sync-Key: X-Container-Sync-Key + - X-Versions-Location: X-Versions-Location + - X-History-Location: X-History-Location + - X-Remove-Versions-Location: X-Remove-Versions-Location + - X-Remove-History-Location: X-Remove-History-Location + - X-Container-Meta-name: X-Container-Meta-name_req + - X-Container-Meta-Access-Control-Allow-Origin: X-Container-Meta-Access-Control-Allow-Origin + - X-Container-Meta-Access-Control-Max-Age: X-Container-Meta-Access-Control-Max-Age + - X-Container-Meta-Access-Control-Expose-Headers: X-Container-Meta-Access-Control-Expose-Headers + - X-Container-Meta-Quota-Bytes: X-Container-Meta-Quota-Bytes + - X-Container-Meta-Quota-Count: X-Container-Meta-Quota-Count + - X-Container-Meta-Web-Directory-Type: X-Container-Meta-Web-Directory-Type + - X-Container-Meta-Temp-URL-Key: X-Container-Meta-Temp-URL-Key_req + - X-Container-Meta-Temp-URL-Key-2: X-Container-Meta-Temp-URL-Key-2_req + - X-Trans-Id-Extra: X-Trans-Id-Extra + + +Response Parameters +------------------- + +.. rest_parameters:: parameters.yaml + + - Date: Date + - X-Timestamp: X-Timestamp + - Content-Length: Content-Length_cud_resp + - Content-Type: Content-Type_cud_resp + - X-Trans-Id: X-Trans-Id + - X-Openstack-Request-Id: X-Openstack-Request-Id + + + + + +Show container metadata +======================= + +.. rest_method:: HEAD /v1/{account}/{container} + +Shows container metadata, including the number of objects and the total bytes of all objects stored in the container. + +Show container metadata request: + +:: + + curl -i $publicURL/marktwain -X HEAD -H "X-Auth-Token: $token" + + + + +:: + + HTTP/1.1 204 No Content + Content-Length: 0 + X-Container-Object-Count: 1 + Accept-Ranges: bytes + X-Container-Meta-Book: TomSawyer + X-Timestamp: 1389727543.65372 + X-Container-Meta-Author: SamuelClemens + X-Container-Bytes-Used: 14 + Content-Type: text/plain; charset=utf-8 + X-Trans-Id: tx0287b982a268461b9ec14-0052d826e2 + X-Openstack-Request-Id: tx0287b982a268461b9ec14-0052d826e2 + Date: Thu, 16 Jan 2014 18:37:22 GMT + + +If the request succeeds, the operation returns the ``No Content +(204)`` response code. + +Normal response codes: 204 + + +Request +------- + +.. rest_parameters:: parameters.yaml + + - account: account + - container: container + - X-Auth-Token: X-Auth-Token + - X-Service-Token: X-Service-Token + - X-Newest: X-Newest + - X-Trans-Id-Extra: X-Trans-Id-Extra + + +Response Parameters +------------------- + +.. 
rest_parameters:: parameters.yaml + + - X-Container-Meta-name: X-Container-Meta-name + - Content-Length: Content-Length_cud_resp + - X-Container-Object-Count: X-Container-Object-Count + - X-Container-Bytes-Used: X-Container-Bytes-Used + - X-Container-Write: X-Container-Write_resp + - X-Container-Meta-Quota-Bytes: X-Container-Meta-Quota-Bytes_resp + - X-Container-Meta-Quota-Count: X-Container-Meta-Quota-Count_resp + - Accept-Ranges: Accept-Ranges + - X-Container-Read: X-Container-Read_resp + - X-Container-Meta-Access-Control-Expose-Headers: X-Container-Meta-Access-Control-Expose-Headers + - X-Container-Meta-Temp-URL-Key: X-Container-Meta-Temp-URL-Key_resp + - X-Container-Meta-Temp-URL-Key-2: X-Container-Meta-Temp-URL-Key-2_resp + - X-Timestamp: X-Timestamp + - X-Container-Meta-Access-Control-Allow-Origin: X-Container-Meta-Access-Control-Allow-Origin + - X-Container-Meta-Access-Control-Max-Age: X-Container-Meta-Access-Control-Max-Age + - X-Container-Sync-Key: X-Container-Sync-Key_resp + - X-Container-Sync-To: X-Container-Sync-To_resp + - Date: Date + - X-Trans-Id: X-Trans-Id + - X-Openstack-Request-Id: X-Openstack-Request-Id + - Content-Type: Content-Type_cud_resp + - X-Versions-Location: X-Versions-Location_resp + - X-History-Location: X-History-Location_resp + - X-Storage-Policy: X-Storage-Policy + + + + + +Delete container +================ + +.. rest_method:: DELETE /v1/{account}/{container} + +Deletes an empty container. + +This operation fails unless the container is empty. An empty +container has no objects. + +Delete the ``steven`` container: + +:: + + curl -i $publicURL/steven -X DELETE -H "X-Auth-Token: $token" + + +If the container does not exist, the response is: + +:: + + HTTP/1.1 404 Not Found + Content-Length: 70 + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: tx4d728126b17b43b598bf7-0052d81e34 + X-Openstack-Request-Id: tx4d728126b17b43b598bf7-0052d81e34 + Date: Thu, 16 Jan 2014 18:00:20 GMT + + +If the container exists and the deletion succeeds, the response is: + +:: + + HTTP/1.1 204 No Content + Content-Length: 0 + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: txf76c375ebece4df19c84c-0052d81f14 + X-Openstack-Request-Id: txf76c375ebece4df19c84c-0052d81f14 + Date: Thu, 16 Jan 2014 18:04:04 GMT + + +If the container exists but is not empty, the response is: + +:: + + HTTP/1.1 409 Conflict + Content-Length: 95 + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: tx7782dc6a97b94a46956b5-0052d81f6b + X-Openstack-Request-Id: tx7782dc6a97b94a46956b5-0052d81f6b + Date: Thu, 16 Jan 2014 18:05:31 GMT + +

+   <html>
+   <h1>Conflict</h1>
+   <p>There was a conflict when trying to complete your request.</p>
+   </html>

+ + +Normal response codes: 204 + +Error response codes: 404, 409 + + +Request +------- + +.. rest_parameters:: parameters.yaml + + - account: account + - container: container + - X-Auth-Token: X-Auth-Token + - X-Service-Token: X-Service-Token + - X-Trans-Id-Extra: X-Trans-Id-Extra + + +Response Parameters +------------------- + +.. rest_parameters:: parameters.yaml + + - Date: Date + - X-Timestamp: X-Timestamp + - Content-Length: Content-Length_cud_resp + - Content-Type: Content-Type_cud_resp + - X-Trans-Id: X-Trans-Id + - X-Openstack-Request-Id: X-Openstack-Request-Id + + + + + + diff --git a/api-ref/source/storage-object-services.inc b/api-ref/source/storage-object-services.inc new file mode 100644 index 0000000000..2519b5973d --- /dev/null +++ b/api-ref/source/storage-object-services.inc @@ -0,0 +1,787 @@ +.. -*- rst -*- + +======= +Objects +======= + +Creates, replaces, shows details for, and deletes objects. Copies +objects from another object with a new or different name. Updates +object metadata. For more information and concepts about +objects see `Object Storage API overview +`_ +and `Large Objects +`_. + + +Get object content and metadata +=============================== + +.. rest_method:: GET /v1/{account}/{container}/{object} + +Downloads the object content and gets the object metadata. + +This operation returns the object metadata in the response headers +and the object content in the response body. + +If this is a large object, the response body contains the +concatenated content of the segment objects. To get the manifest +instead of concatenated segment objects for a static large object, +use the ``multipart-manifest`` query parameter. + +Example requests and responses: + +- Show object details for the ``goodbye`` object in the + ``marktwain`` container: + + :: + + curl -i $publicURL/marktwain/goodbye -X GET -H "X-Auth-Token: $token" + + + + + :: + + HTTP/1.1 200 OK + Content-Length: 14 + Accept-Ranges: bytes + Last-Modified: Wed, 15 Jan 2014 16:41:49 GMT + Etag: 451e372e48e0f6b1114fa0724aa79fa1 + X-Timestamp: 1389804109.39027 + X-Object-Meta-Orig-Filename: goodbyeworld.txt + Content-Type: application/octet-stream + X-Trans-Id: tx8145a190241f4cf6b05f5-0052d82a34 + X-Openstack-Request-Id: tx8145a190241f4cf6b05f5-0052d82a34 + Date: Thu, 16 Jan 2014 18:51:32 GMT + Goodbye World! + + +- Show object details for the ``goodbye`` object, which does not + exist, in the ``janeausten`` container: + + :: + + curl -i $publicURL/janeausten/goodbye -X GET -H "X-Auth-Token: $token" + + + + + :: + + HTTP/1.1 404 Not Found + Content-Length: 70 + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: tx073f7cbb850c4c99934b9-0052d82b04 + X-Openstack-Request-Id: tx073f7cbb850c4c99934b9-0052d82b04 + Date: Thu, 16 Jan 2014 18:55:00 GMT + +

+      <html>
+      <h1>Not Found</h1>
+      <p>The resource could not be found.</p>
+      </html>
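+
+
+- Request only part of the ``goodbye`` object with the standard ``Range``
+  header; the byte range shown is illustrative:
+
+  ::
+
+     # A satisfiable byte range returns ``206 Partial Content`` along with
+     # a Content-Range header describing the bytes returned.
+     curl -i $publicURL/marktwain/goodbye -X GET -H "X-Auth-Token: $token" -H "Range: bytes=0-4"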

+ + + +The operation returns the ``Range Not Satisfiable (416)`` response +code for any ranged GET requests that specify more than: + +- Fifty ranges. + +- Three overlapping ranges. + +- Eight non-increasing ranges. + + +Normal response codes: 200 + +Error response codes: 416, 404 + + +Request +------- + +.. rest_parameters:: parameters.yaml + + - account: account + - container: container + - object: object + - X-Auth-Token: X-Auth-Token + - X-Service-Token: X-Service-Token + - X-Newest: X-Newest + - temp_url_sig: temp_url_sig + - temp_url_expires: temp_url_expires + - filename: filename + - multipart-manifest: multipart-manifest_get + - symlink: symlink + - Range: Range + - If-Match: If-Match + - If-None-Match: If-None-Match-get-request + - If-Modified-Since: If-Modified-Since + - If-Unmodified-Since: If-Unmodified-Since + - X-Trans-Id-Extra: X-Trans-Id-Extra + + +Response Parameters +------------------- + +.. rest_parameters:: parameters.yaml + + - Content-Length: Content-Length_get_resp + - Content-Type: Content-Type_obj_resp + - X-Object-Meta-name: X-Object-Meta-name_resp + - Content-Disposition: Content-Disposition_resp + - Content-Encoding: Content-Encoding_resp + - X-Delete-At: X-Delete-At_resp + - Accept-Ranges: Accept-Ranges + - X-Object-Manifest: X-Object-Manifest_resp + - Last-Modified: Last-Modified + - ETag: ETag_obj_resp + - X-Timestamp: X-Timestamp + - X-Trans-Id: X-Trans-Id + - X-Openstack-Request-Id: X-Openstack-Request-Id + - Date: Date + - X-Static-Large-Object: X-Static-Large-Object + - X-Symlink-Target: X-Symlink-Target_resp + - X-Symlink-Target-Account: X-Symlink-Target-Account_resp + + +Response Example +---------------- + +See examples above. + + +Create or replace object +======================== + +.. rest_method:: PUT /v1/{account}/{container}/{object} + +Creates an object with data content and metadata, or replaces an existing object with data content and metadata. + +The PUT operation always creates an object. If you use this +operation on an existing object, you replace the existing object +and metadata rather than modifying the object. Consequently, this +operation returns the ``Created (201)`` response code. + +If you use this operation to copy a manifest object, the new object +is a normal object and not a copy of the manifest. Instead it is a +concatenation of all the segment objects. This means that you +cannot copy objects larger than 5 GB. + +Note that the provider may have limited the characters which are allowed +in an object name. Any name limits are exposed under the ``name_check`` key +in the ``/info`` discoverability response. Regardless of ``name_check`` +limitations, names must be URL quoted UTF-8. + +To create custom metadata, use the +``X-Object-Meta-name`` header, where ``name`` is the name of the metadata +item. + +.. 
include:: metadata_header_syntax.inc + +Example requests and responses: + +- Create object: + + :: + + curl -i $publicURL/janeausten/helloworld.txt -X PUT -d "Hello" -H "Content-Type: text/html; charset=UTF-8" -H "X-Auth-Token: $token" + + + + + :: + + HTTP/1.1 201 Created + Last-Modified: Fri, 17 Jan 2014 17:28:35 GMT + Content-Length: 0 + Etag: 8b1a9953c4611296a827abf8c47804d7 + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: tx4d5e4f06d357462bb732f-0052d96843 + X-Openstack-Request-Id: tx4d5e4f06d357462bb732f-0052d96843 + Date: Fri, 17 Jan 2014 17:28:35 GMT + + +- Replace object: + + :: + + curl -i $publicURL/janeausten/helloworld.txt -X PUT -d "Hola" -H "X-Auth-Token: $token" + + + + + :: + + HTTP/1.1 201 Created + Last-Modified: Fri, 17 Jan 2014 17:28:35 GMT + Content-Length: 0 + Etag: f688ae26e9cfa3ba6235477831d5122e + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: tx4d5e4f06d357462bb732f-0052d96843 + X-Openstack-Request-Id: tx4d5e4f06d357462bb732f-0052d96843 + Date: Fri, 17 Jan 2014 17:28:35 GMT + + +The ``Created (201)`` response code indicates a successful write. + +If the container for the object does not already exist, the operation +returns the ``404 Not Found`` response code. + +If the request times out, the operation returns the ``Request +Timeout (408)`` response code. + +The ``Length Required (411)`` response code indicates a missing +``Transfer-Encoding`` or ``Content-Length`` request header. + +If the MD5 checksum of the data that is written to the object store +does not match the optional ``ETag`` value, the operation returns +the ``Unprocessable Entity (422)`` response code. + +Normal response codes: 201 + +Error response codes: 404, 408, 411, 422 + + +Request +------- + +.. rest_parameters:: parameters.yaml + + - account: account + - container: container + - object: object + - multipart-manifest: multipart-manifest_put + - temp_url_sig: temp_url_sig + - temp_url_expires: temp_url_expires + - X-Object-Manifest: X-Object-Manifest + - X-Auth-Token: X-Auth-Token + - X-Service-Token: X-Service-Token + - Content-Length: Content-Length_put_req + - Transfer-Encoding: Transfer-Encoding + - Content-Type: Content-Type_obj_cu_req + - X-Detect-Content-Type: X-Detect-Content-Type + - X-Copy-From: X-Copy-From + - X-Copy-From-Account: X-Copy-From-Account + - ETag: ETag_obj_req + - Content-Disposition: Content-Disposition + - Content-Encoding: Content-Encoding + - X-Delete-At: X-Delete-At + - X-Delete-After: X-Delete-After + - X-Object-Meta-name: X-Object-Meta-name + - If-None-Match: If-None-Match-put-request + - X-Trans-Id-Extra: X-Trans-Id-Extra + - X-Symlink-Target: X-Symlink-Target + - X-Symlink-Target-Account: X-Symlink-Target-Account + + +Response Parameters +------------------- + +.. rest_parameters:: parameters.yaml + + - Content-Length: Content-Length_cud_resp + - ETag: ETag_obj_received + - X-Timestamp: X-Timestamp + - X-Trans-Id: X-Trans-Id + - X-Openstack-Request-Id: X-Openstack-Request-Id + - Date: Date + - Content-Type: Content-Type_obj_resp + - last_modified: last_modified + + + + + + + + +Copy object +=========== + +.. rest_method:: COPY /v1/{account}/{container}/{object} + +Copies an object to another object in the object store. + +You can copy an object to a new object with the same name. Copying +to the same name is an alternative to using POST to add metadata to +an object. With POST, you must specify all the metadata. With COPY, +you can add additional metadata to the object. 
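+
+For example, copying an object onto itself to add a single metadata item,
+while leaving its existing metadata in place, might look like the following
+(the container, object, and metadata names are illustrative):
+
+::
+
+   # Copy ``goodbye`` onto itself, adding one metadata item to it
+   curl -i $publicURL/marktwain/goodbye -X COPY -H "X-Auth-Token: $token" -H "Destination: marktwain/goodbye" -H "X-Object-Meta-Icon: Flag"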
+ +With COPY, you can set the ``X-Fresh-Metadata`` header to ``true`` +to copy the object without any existing metadata. + +Alternatively, you can use PUT with the ``X-Copy-From`` request +header to accomplish the same operation as the COPY object +operation. + +The COPY operation always creates an object. If you use this +operation on an existing object, you replace the existing object +and metadata rather than modifying the object. Consequently, this +operation returns the ``Created (201)`` response code. + +Normally, if you use this operation to copy a manifest object, the new object +is a normal object and not a copy of the manifest. Instead it is a +concatenation of all the segment objects. This means that you +cannot copy objects larger than 5 GB in size. + +To copy the manifest object, you include the +``multipart-manifest=get`` query string in the COPY request. +The new object contains the same manifest as the original. +The segment objects are not copied. Instead, both the original +and new manifest objects share the same set of segment objects. + +To copy a symlink either with a COPY or a PUT with the +``X-Copy-From`` request, include the ``symlink=get`` query string. +The new symlink will have the same target as the original. +The target object is not copied. Instead, both the original +and new symlinks point to the same target object. + +All metadata is +preserved during the object copy. If you specify metadata on the +request to copy the object, either PUT or COPY , the metadata +overwrites any conflicting keys on the target (new) object. + +Example requests and responses: + +- Copy the ``goodbye`` object from the ``marktwain`` container to + the ``janeausten`` container: + + :: + + curl -i $publicURL/marktwain/goodbye -X COPY -H "X-Auth-Token: $token" -H "Destination: janeausten/goodbye" + + + + + :: + + HTTP/1.1 201 Created + Content-Length: 0 + X-Copied-From-Last-Modified: Thu, 16 Jan 2014 21:19:45 GMT + X-Copied-From: marktwain/goodbye + Last-Modified: Fri, 17 Jan 2014 18:22:57 GMT + Etag: 451e372e48e0f6b1114fa0724aa79fa1 + Content-Type: text/html; charset=UTF-8 + X-Object-Meta-Movie: AmericanPie + X-Trans-Id: txdcb481ad49d24e9a81107-0052d97501 + X-Openstack-Request-Id: txdcb481ad49d24e9a81107-0052d97501 + Date: Fri, 17 Jan 2014 18:22:57 GMT + + +- Alternatively, you can use PUT to copy the ``goodbye`` object from + the ``marktwain`` container to the ``janeausten`` container. This + request requires a ``Content-Length`` header, even if it is set + to zero (0). + + :: + + curl -i $publicURL/janeausten/goodbye -X PUT -H "X-Auth-Token: $token" -H "X-Copy-From: /marktwain/goodbye" -H "Content-Length: 0" + + + + + :: + + HTTP/1.1 201 Created + Content-Length: 0 + X-Copied-From-Last-Modified: Thu, 16 Jan 2014 21:19:45 GMT + X-Copied-From: marktwain/goodbye + Last-Modified: Fri, 17 Jan 2014 18:22:57 GMT + Etag: 451e372e48e0f6b1114fa0724aa79fa1 + Content-Type: text/html; charset=UTF-8 + X-Object-Meta-Movie: AmericanPie + X-Trans-Id: txdcb481ad49d24e9a81107-0052d97501 + X-Openstack-Request-Id: txdcb481ad49d24e9a81107-0052d97501 + Date: Fri, 17 Jan 2014 18:22:57 GMT + + +When several replicas exist, the system copies from the most recent +replica. That is, the COPY operation behaves as though the +``X-Newest`` header is in the request. + +Normal response codes: 201 + + +Request +------- + +.. 
rest_parameters:: parameters.yaml + + - account: account + - container: container + - object: object + - multipart-manifest: multipart-manifest_copy + - symlink: symlink_copy + - X-Auth-Token: X-Auth-Token + - X-Service-Token: X-Service-Token + - Destination: Destination + - Destination-Account: Destination-Account + - Content-Type: Content-Type_obj_cu_req + - Content-Encoding: Content-Encoding + - Content-Disposition: Content-Disposition + - X-Object-Meta-name: X-Object-Meta-name + - X-Fresh-Metadata: X-Fresh-Metadata + - X-Trans-Id-Extra: X-Trans-Id-Extra + + +Response Parameters +------------------- + +.. rest_parameters:: parameters.yaml + + - Content-Length: Content-Length_cud_resp + - X-Copied-From-Last-Modified: X-Copied-From-Last-Modified + - X-Copied-From: X-Copied-From + - X-Copied-From-Account: X-Copied-From-Account + - Last-Modified: Last-Modified + - ETag: ETag_obj_copied + - X-Timestamp: X-Timestamp + - X-Trans-Id: X-Trans-Id + - X-Openstack-Request-Id: X-Openstack-Request-Id + - Date: Date + - Content-Type: Content-Type_obj_resp + + + + + +Delete object +============= + +.. rest_method:: DELETE /v1/{account}/{container}/{object} + +Permanently deletes an object from the object store. + +Object deletion occurs as soon as possible. Subsequent GET, HEAD, POST, +or DELETE operations should return a ``404 Not Found`` error code, but +may return stale data due to eventual consistency. + +For static large object manifests, you can add the +``?multipart-manifest=delete`` query parameter. This operation deletes +the segment objects and, if all deletions succeed, this operation +deletes the manifest object. + +A DELETE request made to a symlink path will delete the symlink +rather than the target object. + +An alternative to using the DELETE operation is to use +the POST operation with the ``bulk-delete`` query parameter. + +Example request and response: + +- Delete the ``helloworld`` object from the ``marktwain`` container: + + :: + + curl -i $publicURL/marktwain/helloworld -X DELETE -H "X-Auth-Token: $token" + + + + + :: + + HTTP/1.1 204 No Content + Content-Length: 0 + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: tx36c7606fcd1843f59167c-0052d6fdac + X-Openstack-Request-Id: tx36c7606fcd1843f59167c-0052d6fdac + Date: Wed, 15 Jan 2014 21:29:16 GMT + + +Typically, the DELETE operation does not return a response body. +However, with the ``multipart-manifest=delete`` query parameter, +the response body contains a list of manifest and segment objects +and the status of their DELETE operations. + +Normal response codes: 204 + + +Request +------- + +.. rest_parameters:: parameters.yaml + + - account: account + - container: container + - object: object + - multipart-manifest: multipart-manifest_delete + - X-Auth-Token: X-Auth-Token + - X-Service-Token: X-Service-Token + - X-Trans-Id-Extra: X-Trans-Id-Extra + + +Response Parameters +------------------- + +.. rest_parameters:: parameters.yaml + + - Date: Date + - X-Timestamp: X-Timestamp + - Content-Length: Content-Length_cud_resp + - Content-Type: Content-Type_cud_resp + - X-Trans-Id: X-Trans-Id + - X-Openstack-Request-Id: X-Openstack-Request-Id + + + + + +Show object metadata +==================== + +.. rest_method:: HEAD /v1/{account}/{container}/{object} + +Shows object metadata. 
+ + + +Example requests and responses: + +- Show object metadata: + + :: + + curl $publicURL/marktwain/goodbye --head -H "X-Auth-Token: $token" + + + + + :: + + HTTP/1.1 200 OK + Content-Length: 14 + Accept-Ranges: bytes + Last-Modified: Thu, 16 Jan 2014 21:12:31 GMT + Etag: 451e372e48e0f6b1114fa0724aa79fa1 + X-Timestamp: 1389906751.73463 + X-Object-Meta-Book: GoodbyeColumbus + Content-Type: application/octet-stream + X-Trans-Id: tx37ea34dcd1ed48ca9bc7d-0052d84b6f + X-Openstack-Request-Id: tx37ea34dcd1ed48ca9bc7d-0052d84b6f + Date: Thu, 16 Jan 2014 21:13:19 GMT + + Note: The ``--head`` option was used in the above example. If we had + used ``-i -X HEAD`` and the ``Content-Length`` response header is non-zero, + the cURL command stalls after it prints the response headers because it + is waiting for a response body. However, the Object Storage system + does not return a response body for the HEAD operation. + + +If the request succeeds, the operation returns the ``200`` response +code. + + +Normal response codes: 200 + + +Request +------- + +.. rest_parameters:: parameters.yaml + + - account: account + - container: container + - object: object + - X-Auth-Token: X-Auth-Token + - X-Service-Token: X-Service-Token + - temp_url_sig: temp_url_sig + - temp_url_expires: temp_url_expires + - filename: filename + - multipart-manifest: multipart-manifest_head + - symlink: symlink + - X-Newest: X-Newest + - If-Match: If-Match + - If-None-Match: If-None-Match-get-request + - If-Modified-Since: If-Modified-Since + - If-Unmodified-Since: If-Unmodified-Since + - X-Trans-Id-Extra: X-Trans-Id-Extra + + +Response Parameters +------------------- + +.. rest_parameters:: parameters.yaml + + - Content-Length: Content-Length_obj_head_resp + - X-Object-Meta-name: X-Object-Meta-name + - Content-Disposition: Content-Disposition_resp + - Content-Encoding: Content-Encoding_resp + - X-Delete-At: X-Delete-At_resp + - X-Object-Manifest: X-Object-Manifest_resp + - Last-Modified: Last-Modified + - ETag: ETag_obj_resp + - X-Timestamp: X-Timestamp + - X-Trans-Id: X-Trans-Id + - X-Openstack-Request-Id: X-Openstack-Request-Id + - Date: Date + - X-Static-Large-Object: X-Static-Large-Object + - Content-Type: Content-Type_obj_resp + - X-Symlink-Target: X-Symlink-Target_resp + - X-Symlink-Target-Account: X-Symlink-Target-Account_resp + + +Response Example +---------------- + +See examples above. + + + +Create or update object metadata +================================ + +.. rest_method:: POST /v1/{account}/{container}/{object} + +Creates or updates object metadata. + +To create or update custom metadata, use the +``X-Object-Meta-name`` header, where ``name`` is the name of the metadata +item. + +.. include:: metadata_header_syntax.inc + +In addition to the custom metadata, you can update the +``Content-Type``, ``Content-Encoding``, ``Content-Disposition``, and +``X-Delete-At`` system metadata items. However you cannot update other +system metadata, such as ``Content-Length`` or ``Last-Modified``. + +You can use COPY as an alternate to the POST operation by copying +to the same object. With the POST operation you must specify all +metadata items, whereas with the COPY operation, you need to +specify only changed or additional items. +All metadata is preserved during the object copy. If you specify +metadata on the request to copy the object, either PUT or COPY , +the metadata overwrites any conflicting keys on the target (new) +object. + +.. 
note:: + + While using COPY instead of POST allows sending only a subset of + the metadata, it carries the cost of reading and rewriting the entire + contents of the object. + +A POST request deletes any existing custom metadata that you added +with a previous PUT or POST request. Consequently, you must specify +all custom metadata in the request. However, system metadata is +unchanged by the POST request unless you explicitly supply it in a +request header. + +You can also set the ``X-Delete-At`` or ``X-Delete-After`` header +to define when to expire the object. + +When used as described in this section, the POST operation creates +or replaces metadata. This form of the operation has no request +body. There are alternate uses of the POST operation as follows: + +- You can also use the `form POST feature + `_ to upload objects. + +- The POST operation when used with the ``bulk-delete`` query parameter + can be used to delete multiple objects and containers in a single + operation. + +- The POST operation when used with the ``extract-archive`` query parameter + can be used to upload an archive (tar file). The archive is then extracted + to create objects. + +A POST request must not include X-Symlink-Target header. If it does then a +400 status code is returned and the object metadata is not modified. + +When a POST request is sent to a symlink, the metadata will be applied to the +symlink, but the request will result in a ``307 Temporary Redirect`` response +to the client. The POST is never redirected to the target object, thus a +GET/HEAD request to the symlink without ``symlink=get`` will not return the +metadata that was sent as part of the POST request. + +Example requests and responses: + +- Create object metadata: + + :: + + curl -i $publicURL/marktwain/goodbye -X POST -H "X-Auth-Token: $token" -H "X-Object-Meta-Book: GoodbyeColumbus" + + + + + :: + + HTTP/1.1 202 Accepted + Content-Length: 76 + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: txb5fb5c91ba1f4f37bb648-0052d84b3f + X-Openstack-Request-Id: txb5fb5c91ba1f4f37bb648-0052d84b3f + Date: Thu, 16 Jan 2014 21:12:31 GMT + +

+      <html>
+      <h1>Accepted</h1>
+      <p>The request is accepted for processing.</p>
+      </html>

+ + + +- Update object metadata: + + :: + + curl -i $publicURL/marktwain/goodbye -X POST -H "X-Auth-Token: $token" -H "X-Object-Meta-Book: GoodbyeOldFriend" + + + + + :: + + HTTP/1.1 202 Accepted + Content-Length: 76 + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: tx5ec7ab81cdb34ced887c8-0052d84ca4 + X-Openstack-Request-Id: tx5ec7ab81cdb34ced887c8-0052d84ca4 + Date: Thu, 16 Jan 2014 21:18:28 GMT + +

+      <html>
+      <h1>Accepted</h1>
+      <p>The request is accepted for processing.</p>
+      </html>
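+
+
+- Update object metadata and set an expiry at the same time; the
+  ``X-Delete-After`` value (one day, in seconds) is illustrative. Because a
+  POST replaces all custom metadata, the existing ``X-Object-Meta-Book``
+  item is sent again as well:
+
+  ::
+
+     curl -i $publicURL/marktwain/goodbye -X POST -H "X-Auth-Token: $token" -H "X-Object-Meta-Book: GoodbyeOldFriend" -H "X-Delete-After: 86400"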

+ + +Normal response codes: 202 + + +Request +------- + +.. rest_parameters:: parameters.yaml + + - account: account + - container: container + - object: object + - bulk-delete: bulk-delete + - extract-archive: extract-archive + - X-Auth-Token: X-Auth-Token + - X-Service-Token: X-Service-Token + - X-Object-Meta-name: X-Object-Meta-name + - X-Delete-At: X-Delete-At + - X-Delete-After: X-Delete-After + - Content-Disposition: Content-Disposition + - Content-Encoding: Content-Encoding + - Content-Type: Content-Type_obj_cu_req + - X-Trans-Id-Extra: X-Trans-Id-Extra + + +Response Parameters +------------------- + +.. rest_parameters:: parameters.yaml + + - Date: Date + - X-Timestamp: X-Timestamp + - Content-Length: Content-Length_cud_resp + - Content-Type: Content-Type_cud_resp + - X-Trans-Id: X-Trans-Id + - X-Openstack-Request-Id: X-Openstack-Request-Id + + + + diff --git a/api-ref/source/storage_endpoints.inc b/api-ref/source/storage_endpoints.inc new file mode 100644 index 0000000000..41845425d4 --- /dev/null +++ b/api-ref/source/storage_endpoints.inc @@ -0,0 +1,37 @@ +.. -*- rst -*- + +========= +Endpoints +========= + +If configured, lists endpoints for an account. + + +List endpoints +============== + +.. rest_method:: GET /v1/endpoints + +Lists endpoints for an object, account, or container. + +When the cloud provider enables middleware to list the +``/endpoints/`` path, software that needs data location information +can use this call to avoid network overhead. The cloud provider can +map the ``/endpoints/`` path to another resource, so this exact +resource might vary from provider to provider. Because it goes +straight to the middleware, the call is not authenticated, so be +sure you have tightly secured the environment and network when +using this call. + +Error response codes:201, + + +Request +------- + +This operation does not accept a request body. + + + + + diff --git a/api-ref/source/storage_info.inc b/api-ref/source/storage_info.inc new file mode 100644 index 0000000000..0487210b3d --- /dev/null +++ b/api-ref/source/storage_info.inc @@ -0,0 +1,46 @@ +.. -*- rst -*- + +=============== +Discoverability +=============== + +If configured, lists the activated capabilities for this version of +the OpenStack Object Storage API. + + +List activated capabilities +=========================== + +.. rest_method:: GET /info + +Lists the activated capabilities for this version of the OpenStack Object Storage API. + +Most of the information is "public" i.e. visible to all callers. However, some +configuration and capability items are reserved for the administrators of the +system. To access this data, the ``swiftinfo_sig`` and ``swiftinfo_expires`` +query parameters must be added to the request. + + +Normal response codes: 200 +Error response codes: + + +Request +------- + +.. rest_parameters:: parameters.yaml + + - swiftinfo_sig: swiftinfo_sig + - swiftinfo_expires: swiftinfo_expires + + + + +Response Example +---------------- + +.. literalinclude:: samples/capabilities-list-response.json + :language: javascript + + + diff --git a/babel.cfg b/babel.cfg deleted file mode 100644 index 15cd6cb76b..0000000000 --- a/babel.cfg +++ /dev/null @@ -1,2 +0,0 @@ -[python: **.py] - diff --git a/bandit.yaml b/bandit.yaml new file mode 100644 index 0000000000..62b37689b4 --- /dev/null +++ b/bandit.yaml @@ -0,0 +1,111 @@ + +### This config may optionally select a subset of tests to run or skip by +### filling out the 'tests' and 'skips' lists given below. 
If no tests are +### specified for inclusion then it is assumed all tests are desired. The skips +### set will remove specific tests from the include set. This can be controlled +### using the -t/-s CLI options. Note that the same test ID should not appear +### in both 'tests' and 'skips', this would be nonsensical and is detected by +### Bandit at runtime. + +# See https://bandit.readthedocs.io/en/latest/blacklists/blacklist_calls.html +# for documentation of the available tests. + +# (optional) list included test IDs here, eg '[B101, B406]': +tests: + +# (optional) list skipped test IDs here, eg '[B101, B406]': +skips: + # We default to binding to all interfaces + - B104 + # Yes, we sometimes catch just to quietly swallow an exception + - B110 + # We use insecure randomness all over the place, because + # it's exceedingly rare that we need secure randomness + - B311 + # We dynamically build SQL all over the place + - B608 + # We often use subprocesses, and require a lot of trust in our use of them + - B404 + - B603 + - B607 + # We parse xml + - B405 + - B603 + +### (optional) plugin settings - some test plugins require configuration data +### that may be given here, per-plugin. All bandit test plugins have a built in +### set of sensible defaults and these will be used if no configuration is +### provided. It is not necessary to provide settings for every (or any) plugin +### if the defaults are acceptable. + +#any_other_function_with_shell_equals_true: +# no_shell: [os.execl, os.execle, os.execlp, os.execlpe, os.execv, os.execve, os.execvp, +# os.execvpe, os.spawnl, os.spawnle, os.spawnlp, os.spawnlpe, os.spawnv, os.spawnve, +# os.spawnvp, os.spawnvpe, os.startfile] +# shell: [os.system, os.popen, os.popen2, os.popen3, os.popen4, popen2.popen2, popen2.popen3, +# popen2.popen4, popen2.Popen3, popen2.Popen4, commands.getoutput, commands.getstatusoutput] +# subprocess: [subprocess.Popen, subprocess.call, subprocess.check_call, subprocess.check_output, +# utils.execute, utils.execute_with_timeout] +#execute_with_run_as_root_equals_true: +# function_names: [ceilometer.utils.execute, cinder.utils.execute, neutron.agent.linux.utils.execute, +# nova.utils.execute, nova.utils.trycmd] +#hardcoded_tmp_directory: +# tmp_dirs: [/tmp, /var/tmp, /dev/shm] +#linux_commands_wildcard_injection: +# no_shell: [os.execl, os.execle, os.execlp, os.execlpe, os.execv, os.execve, os.execvp, +# os.execvpe, os.spawnl, os.spawnle, os.spawnlp, os.spawnlpe, os.spawnv, os.spawnve, +# os.spawnvp, os.spawnvpe, os.startfile] +# shell: [os.system, os.popen, os.popen2, os.popen3, os.popen4, popen2.popen2, popen2.popen3, +# popen2.popen4, popen2.Popen3, popen2.Popen4, commands.getoutput, commands.getstatusoutput] +# subprocess: [subprocess.Popen, subprocess.call, subprocess.check_call, subprocess.check_output, +# utils.execute, utils.execute_with_timeout] +#password_config_option_not_marked_secret: +# function_names: [oslo.config.cfg.StrOpt, oslo_config.cfg.StrOpt] +#ssl_with_bad_defaults: +# bad_protocol_versions: [PROTOCOL_SSLv2, SSLv2_METHOD, SSLv23_METHOD, PROTOCOL_SSLv3, +# PROTOCOL_TLSv1, SSLv3_METHOD, TLSv1_METHOD] +#ssl_with_bad_version: +# bad_protocol_versions: [PROTOCOL_SSLv2, SSLv2_METHOD, SSLv23_METHOD, PROTOCOL_SSLv3, +# PROTOCOL_TLSv1, SSLv3_METHOD, TLSv1_METHOD] +#start_process_with_a_shell: +# no_shell: [os.execl, os.execle, os.execlp, os.execlpe, os.execv, os.execve, os.execvp, +# os.execvpe, os.spawnl, os.spawnle, os.spawnlp, os.spawnlpe, os.spawnv, os.spawnve, +# os.spawnvp, os.spawnvpe, os.startfile] +# 
shell: [os.system, os.popen, os.popen2, os.popen3, os.popen4, popen2.popen2, popen2.popen3, +# popen2.popen4, popen2.Popen3, popen2.Popen4, commands.getoutput, commands.getstatusoutput] +# subprocess: [subprocess.Popen, subprocess.call, subprocess.check_call, subprocess.check_output, +# utils.execute, utils.execute_with_timeout] +#start_process_with_no_shell: +# no_shell: [os.execl, os.execle, os.execlp, os.execlpe, os.execv, os.execve, os.execvp, +# os.execvpe, os.spawnl, os.spawnle, os.spawnlp, os.spawnlpe, os.spawnv, os.spawnve, +# os.spawnvp, os.spawnvpe, os.startfile] +# shell: [os.system, os.popen, os.popen2, os.popen3, os.popen4, popen2.popen2, popen2.popen3, +# popen2.popen4, popen2.Popen3, popen2.Popen4, commands.getoutput, commands.getstatusoutput] +# subprocess: [subprocess.Popen, subprocess.call, subprocess.check_call, subprocess.check_output, +# utils.execute, utils.execute_with_timeout] +#start_process_with_partial_path: +# no_shell: [os.execl, os.execle, os.execlp, os.execlpe, os.execv, os.execve, os.execvp, +# os.execvpe, os.spawnl, os.spawnle, os.spawnlp, os.spawnlpe, os.spawnv, os.spawnve, +# os.spawnvp, os.spawnvpe, os.startfile] +# shell: [os.system, os.popen, os.popen2, os.popen3, os.popen4, popen2.popen2, popen2.popen3, +# popen2.popen4, popen2.Popen3, popen2.Popen4, commands.getoutput, commands.getstatusoutput] +# subprocess: [subprocess.Popen, subprocess.call, subprocess.check_call, subprocess.check_output, +# utils.execute, utils.execute_with_timeout] +#subprocess_popen_with_shell_equals_true: +# no_shell: [os.execl, os.execle, os.execlp, os.execlpe, os.execv, os.execve, os.execvp, +# os.execvpe, os.spawnl, os.spawnle, os.spawnlp, os.spawnlpe, os.spawnv, os.spawnve, +# os.spawnvp, os.spawnvpe, os.startfile] +# shell: [os.system, os.popen, os.popen2, os.popen3, os.popen4, popen2.popen2, popen2.popen3, +# popen2.popen4, popen2.Popen3, popen2.Popen4, commands.getoutput, commands.getstatusoutput] +# subprocess: [subprocess.Popen, subprocess.call, subprocess.check_call, subprocess.check_output, +# utils.execute, utils.execute_with_timeout] +#subprocess_without_shell_equals_true: +# no_shell: [os.execl, os.execle, os.execlp, os.execlpe, os.execv, os.execve, os.execvp, +# os.execvpe, os.spawnl, os.spawnle, os.spawnlp, os.spawnlpe, os.spawnv, os.spawnve, +# os.spawnvp, os.spawnvpe, os.startfile] +# shell: [os.system, os.popen, os.popen2, os.popen3, os.popen4, popen2.popen2, popen2.popen3, +# popen2.popen4, popen2.Popen3, popen2.Popen4, commands.getoutput, commands.getstatusoutput] +# subprocess: [subprocess.Popen, subprocess.call, subprocess.check_call, subprocess.check_output, +# utils.execute, utils.execute_with_timeout] +#try_except_continue: {check_typed_exception: false} +#try_except_pass: {check_typed_exception: false} diff --git a/bin/swift-bench b/bin/swift-bench deleted file mode 100755 index b575b1952c..0000000000 --- a/bin/swift-bench +++ /dev/null @@ -1,175 +0,0 @@ -#!/usr/bin/env python -# Copyright (c) 2010-2012 OpenStack, LLC. -# -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. -# You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or -# implied. 
-# See the License for the specific language governing permissions and -# limitations under the License. - -import logging -import os -import sys -import signal -import uuid -from optparse import OptionParser - -from swift.common.bench import (BenchController, DistributedBenchController, - create_containers, delete_containers) -from swift.common.utils import readconf, LogAdapter, config_true_value - -# The defaults should be sufficient to run swift-bench on a SAIO -CONF_DEFAULTS = { - 'auth': os.environ.get('ST_AUTH', ''), - 'user': os.environ.get('ST_USER', ''), - 'key': os.environ.get('ST_KEY', ''), - 'auth_version': '1.0', - 'use_proxy': 'yes', - 'put_concurrency': '10', - 'get_concurrency': '10', - 'del_concurrency': '10', - 'concurrency': '', # set all 3 in one shot - 'object_sources': '', # set of file contents to read and use for PUTs - 'lower_object_size': '10', # bounded random size used if these differ - 'upper_object_size': '10', - 'object_size': '1', # only if not object_sources and lower == upper - 'num_objects': '1000', - 'num_gets': '10000', - 'delete': 'yes', - 'container_name': uuid.uuid4().hex, # really "container name base" - 'num_containers': '20', - 'url': '', # used when use_proxy = no or overrides auth X-Storage-Url - 'account': '', # used when use_proxy = no - 'devices': 'sdb1', # space-sep list - 'log_level': 'INFO', - 'timeout': '10', - 'auth_version': '1.0', - 'bench_clients': [], -} - -SAIO_DEFAULTS = { - 'auth': 'http://localhost:8080/auth/v1.0', - 'user': 'test:tester', - 'key': 'testing', -} - -if __name__ == '__main__': - usage = "usage: %prog [OPTIONS] [CONF_FILE]" - usage += """\n\nConf file with SAIO defaults: - - [bench] - auth = http://localhost:8080/auth/v1.0 - user = test:tester - key = testing - concurrency = 10 - object_size = 1 - num_objects = 1000 - num_gets = 10000 - delete = yes - auth_version = 1.0 - """ - parser = OptionParser(usage=usage) - parser.add_option('', '--saio', dest='saio', action='store_true', - default=False, help='Run benchmark with SAIO defaults') - parser.add_option('-A', '--auth', dest='auth', - help='URL for obtaining an auth token') - parser.add_option('-U', '--user', dest='user', - help='User name for obtaining an auth token') - parser.add_option('-K', '--key', dest='key', - help='Key for obtaining an auth token') - parser.add_option('-b', '--bench-clients', action='append', - metavar=':', - help=('A string of the form ":" which matches ' - 'the arguments supplied to a swift-bench-client ' - 'process. 
This argument must be specified ' - 'once per swift-bench-client you want to ' - 'utilize.')) - parser.add_option('-u', '--url', dest='url', - help='Storage URL') - parser.add_option('-c', '--concurrency', dest='concurrency', - help='Number of concurrent connections to use') - parser.add_option('-s', '--object-size', dest='object_size', - help='Size of objects to PUT (in bytes)') - parser.add_option('-l', '--lower-object-size', dest='lower_object_size', - help=('Lower size of objects (in bytes); ' - '--object-size will be upper-object-size')) - parser.add_option('-n', '--num-objects', dest='num_objects', - help='Number of objects to PUT') - parser.add_option('-g', '--num-gets', dest='num_gets', - help='Number of GET operations to perform') - parser.add_option('-x', '--no-delete', dest='delete', action='store_false', - help='If set, will not delete the objects created') - parser.add_option('-V', '--auth_version', dest='auth_version', - help='Authentication version') - - if len(sys.argv) == 1: - parser.print_help() - sys.exit(1) - options, args = parser.parse_args() - if options.saio: - CONF_DEFAULTS.update(SAIO_DEFAULTS) - if getattr(options, 'lower_object_size', None): - if options.object_size <= options.lower_object_size: - raise ValueError('--lower-object-size (%s) must be ' - '< --object-size (%s)' % - (options.lower_object_size, options.object_size)) - CONF_DEFAULTS['upper_object_size'] = options.object_size - if args: - conf = args[0] - if not os.path.exists(conf): - sys.exit("No such conf file: %s" % conf) - conf = readconf(conf, 'bench', log_name='swift-bench', - defaults=CONF_DEFAULTS) - conf['bench_clients'] = [] - else: - conf = CONF_DEFAULTS - parser.set_defaults(**conf) - options, _junk = parser.parse_args() - if options.concurrency is not '': - options.put_concurrency = options.concurrency - options.get_concurrency = options.concurrency - options.del_concurrency = options.concurrency - options.containers = ['%s_%d' % (options.container_name, i) - for i in xrange(int(options.num_containers))] - # check boolean options vs config parameter values - if config_true_value(str(options.delete).lower()): - options.delete = 'yes' - else: - options.delete = 'no' - - def sigterm(signum, frame): - sys.exit('Termination signal received.') - signal.signal(signal.SIGTERM, sigterm) - - logger = logging.getLogger() - logger.setLevel({ - 'debug': logging.DEBUG, - 'info': logging.INFO, - 'warning': logging.WARNING, - 'error': logging.ERROR, - 'critical': logging.CRITICAL}.get( - options.log_level.lower(), logging.INFO)) - loghandler = logging.StreamHandler() - logger.addHandler(loghandler) - logger = LogAdapter(logger, 'swift-bench') - logformat = logging.Formatter('%(server)s %(asctime)s %(levelname)s ' - '%(message)s') - loghandler.setFormatter(logformat) - - if options.use_proxy: - create_containers(logger, options) - - controller_class = DistributedBenchController if options.bench_clients \ - else BenchController - controller = controller_class(logger, options) - controller.run() - - if config_true_value(options.delete.lower()): - delete_containers(logger, options) diff --git a/bin/swift-bench-client b/bin/swift-bench-client deleted file mode 100755 index 9473b4560c..0000000000 --- a/bin/swift-bench-client +++ /dev/null @@ -1,59 +0,0 @@ -#!/usr/bin/env python -# Copyright (c) 2010-2012 OpenStack, LLC. -# -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. 
-# You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or -# implied. -# See the License for the specific language governing permissions and -# limitations under the License. - -import logging -import sys -import signal -from optparse import OptionParser - -from swift.common.bench import BenchServer -from swift.common.utils import LogAdapter - -if __name__ == '__main__': - usage = "usage: %prog " - usage += "\n\nRun a client for distributed swift-bench runs." - parser = OptionParser(usage=usage) - parser.add_option('-o', '--log-level', dest='log_level', - default='info', - help='Logging level (debug, info, etc)') - - if len(sys.argv) != 3: - parser.print_help() - sys.exit(1) - options, args = parser.parse_args() - - logger = logging.getLogger() - logger.setLevel({ - 'debug': logging.DEBUG, - 'info': logging.INFO, - 'warning': logging.WARNING, - 'error': logging.ERROR, - 'critical': logging.CRITICAL}.get( - options.log_level.lower(), logging.INFO)) - loghandler = logging.StreamHandler() - logger.addHandler(loghandler) - logger = LogAdapter(logger, 'swift-bench-client') - logformat = logging.Formatter('%(server)s %(asctime)s %(levelname)s ' - '%(message)s') - loghandler.setFormatter(logformat) - - def sigterm(signum, frame): - sys.exit('Termination signal received.') - signal.signal(signal.SIGTERM, sigterm) - signal.signal(signal.SIGINT, sigterm) - - server = BenchServer(logger, args[0], args[1]) - server.run() diff --git a/bin/swift-container-auditor b/bin/swift-container-auditor deleted file mode 100755 index b49a290f33..0000000000 --- a/bin/swift-container-auditor +++ /dev/null @@ -1,23 +0,0 @@ -#!/usr/bin/env python -# Copyright (c) 2010-2012 OpenStack, LLC. -# -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. -# You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or -# implied. -# See the License for the specific language governing permissions and -# limitations under the License. - -from swift.container.auditor import ContainerAuditor -from swift.common.utils import parse_options -from swift.common.daemon import run_daemon - -if __name__ == '__main__': - conf_file, options = parse_options(once=True) - run_daemon(ContainerAuditor, conf_file, **options) diff --git a/bin/swift-container-replicator b/bin/swift-container-replicator deleted file mode 100755 index 62b803c0c4..0000000000 --- a/bin/swift-container-replicator +++ /dev/null @@ -1,23 +0,0 @@ -#!/usr/bin/env python -# Copyright (c) 2010-2012 OpenStack, LLC. -# -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. -# You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or -# implied. 
-# See the License for the specific language governing permissions and -# limitations under the License. - -from swift.container.replicator import ContainerReplicator -from swift.common.utils import parse_options -from swift.common.daemon import run_daemon - -if __name__ == '__main__': - conf_file, options = parse_options(once=True) - run_daemon(ContainerReplicator, conf_file, **options) diff --git a/bin/swift-container-server b/bin/swift-container-server deleted file mode 100755 index b47dce017f..0000000000 --- a/bin/swift-container-server +++ /dev/null @@ -1,22 +0,0 @@ -#!/usr/bin/env python -# Copyright (c) 2010-2012 OpenStack, LLC. -# -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. -# You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or -# implied. -# See the License for the specific language governing permissions and -# limitations under the License. - -from swift.common.utils import parse_options -from swift.common.wsgi import run_wsgi - -if __name__ == '__main__': - conf_file, options = parse_options() - run_wsgi(conf_file, 'container-server', default_port=6001, **options) diff --git a/bin/swift-container-sync b/bin/swift-container-sync deleted file mode 100755 index 7b6378c4c7..0000000000 --- a/bin/swift-container-sync +++ /dev/null @@ -1,23 +0,0 @@ -#!/usr/bin/python -# Copyright (c) 2010-2012 OpenStack, LLC. -# -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. -# You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or -# implied. -# See the License for the specific language governing permissions and -# limitations under the License. - -from swift.container.sync import ContainerSync -from swift.common.utils import parse_options -from swift.common.daemon import run_daemon - -if __name__ == '__main__': - conf_file, options = parse_options(once=True) - run_daemon(ContainerSync, conf_file, **options) diff --git a/bin/swift-container-updater b/bin/swift-container-updater deleted file mode 100755 index b80cbda092..0000000000 --- a/bin/swift-container-updater +++ /dev/null @@ -1,23 +0,0 @@ -#!/usr/bin/env python -# Copyright (c) 2010-2012 OpenStack, LLC. -# -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. -# You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or -# implied. -# See the License for the specific language governing permissions and -# limitations under the License. 
- -from swift.container.updater import ContainerUpdater -from swift.common.utils import parse_options -from swift.common.daemon import run_daemon - -if __name__ == '__main__': - conf_file, options = parse_options(once=True) - run_daemon(ContainerUpdater, conf_file, **options) diff --git a/bin/swift-dispersion-populate b/bin/swift-dispersion-populate deleted file mode 100755 index 1fe01adc0b..0000000000 --- a/bin/swift-dispersion-populate +++ /dev/null @@ -1,156 +0,0 @@ -#!/usr/bin/env python -# Copyright (c) 2010-2012 OpenStack, LLC. -# -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. -# You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or -# implied. -# See the License for the specific language governing permissions and -# limitations under the License. - -import os -import traceback -from ConfigParser import ConfigParser -from cStringIO import StringIO -from sys import exit, argv, stdout -from time import time -from uuid import uuid4 - -from eventlet import GreenPool, patcher, sleep -from eventlet.pools import Pool - -from swiftclient import Connection, get_auth -from swift.common.ring import Ring -from swift.common.utils import compute_eta, get_time_units - - -def put_container(connpool, container, report): - global retries_done - try: - with connpool.item() as conn: - conn.put_container(container) - retries_done += conn.attempts - 1 - if report: - report(True) - except Exception: - if report: - report(False) - raise - - -def put_object(connpool, container, obj, report): - global retries_done - try: - with connpool.item() as conn: - conn.put_object(container, obj, StringIO(obj), - headers={'x-object-meta-dispersion': obj}) - retries_done += conn.attempts - 1 - if report: - report(True) - except Exception: - if report: - report(False) - raise - - -def report(success): - global begun, created, item_type, next_report, need_to_create, retries_done - if not success: - traceback.print_exc() - exit('Gave up due to error(s).') - created += 1 - if time() < next_report: - return - next_report = time() + 5 - eta, eta_unit = compute_eta(begun, created, need_to_create) - print '\r\x1B[KCreating %s: %d of %d, %d%s left, %d retries' % (item_type, - created, need_to_create, round(eta), eta_unit, retries_done), - stdout.flush() - - -if __name__ == '__main__': - global begun, created, item_type, next_report, need_to_create, retries_done - patcher.monkey_patch() - - conffile = '/etc/swift/dispersion.conf' - if len(argv) == 2: - conffile = argv[1] - elif len(argv) > 2: - exit('Syntax: %s [conffile]' % argv[0]) - c = ConfigParser() - if not c.read(conffile): - exit('Unable to read config file: %s' % conffile) - conf = dict(c.items('dispersion')) - swift_dir = conf.get('swift_dir', '/etc/swift') - dispersion_coverage = int(conf.get('dispersion_coverage', 1)) - retries = int(conf.get('retries', 5)) - concurrency = int(conf.get('concurrency', 25)) - - coropool = GreenPool(size=concurrency) - retries_done = 0 - - url, token = get_auth(conf['auth_url'], conf['auth_user'], - conf['auth_key'], - auth_version=conf.get('auth_version', '1.0')) - account = url.rsplit('/', 1)[1] - connpool = Pool(max_size=concurrency) - connpool.create = lambda: Connection(conf['auth_url'], - 
conf['auth_user'], conf['auth_key'], - retries=retries, - preauthurl=url, preauthtoken=token) - - container_ring = Ring(swift_dir, ring_name='container') - parts_left = dict((x, x) for x in xrange(container_ring.partition_count)) - item_type = 'containers' - created = 0 - retries_done = 0 - need_to_create = need_to_queue = \ - dispersion_coverage / 100.0 * container_ring.partition_count - begun = next_report = time() - next_report += 2 - while need_to_queue >= 1: - container = 'dispersion_%s' % uuid4().hex - part, _junk = container_ring.get_nodes(account, container) - if part in parts_left: - coropool.spawn(put_container, connpool, container, report) - sleep() - del parts_left[part] - need_to_queue -= 1 - coropool.waitall() - elapsed, elapsed_unit = get_time_units(time() - begun) - print '\r\x1B[KCreated %d containers for dispersion reporting, %d%s, %d ' \ - 'retries' % \ - (need_to_create, round(elapsed), elapsed_unit, retries_done) - stdout.flush() - - container = 'dispersion_objects' - put_container(connpool, container, None) - object_ring = Ring(swift_dir, ring_name='object') - parts_left = dict((x, x) for x in xrange(object_ring.partition_count)) - item_type = 'objects' - created = 0 - retries_done = 0 - need_to_create = need_to_queue = \ - dispersion_coverage / 100.0 * object_ring.partition_count - begun = next_report = time() - next_report += 2 - while need_to_queue >= 1: - obj = 'dispersion_%s' % uuid4().hex - part, _junk = object_ring.get_nodes(account, container, obj) - if part in parts_left: - coropool.spawn(put_object, connpool, container, obj, report) - sleep() - del parts_left[part] - need_to_queue -= 1 - coropool.waitall() - elapsed, elapsed_unit = get_time_units(time() - begun) - print '\r\x1B[KCreated %d objects for dispersion reporting, %d%s, %d ' \ - 'retries' % \ - (need_to_create, round(elapsed), elapsed_unit, retries_done) - stdout.flush() diff --git a/bin/swift-drive-audit b/bin/swift-drive-audit deleted file mode 100755 index 6c742a483e..0000000000 --- a/bin/swift-drive-audit +++ /dev/null @@ -1,137 +0,0 @@ -#!/usr/bin/env python -# Copyright (c) 2010-2012 OpenStack, LLC. -# -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. -# You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or -# implied. -# See the License for the specific language governing permissions and -# limitations under the License. - -import datetime -import os -import re -import subprocess -import sys -from ConfigParser import ConfigParser - -from swift.common.utils import get_logger - - -# To search for more types of errors, add the regex to the list below -error_re = [ - re.compile(r'\berror\b.*\b(sd[a-z]{1,2}\d?)\b'), - re.compile(r'\b(sd[a-z]{1,2}\d?)\b.*\berror\b'), -] - - -def get_devices(device_dir, logger): - devices = [] - for line in open('/proc/mounts').readlines(): - data = line.strip().split() - block_device = data[0] - mount_point = data[1] - if mount_point.startswith(device_dir): - device = {} - device['mount_point'] = mount_point - device['block_device'] = block_device - try: - device_num = os.stat(block_device).st_rdev - except OSError, e: - # If we can't stat the device, then something weird is going on - logger.error("Error: Could not stat %s!" 
% - block_device) - continue - device['major'] = str(os.major(device_num)) - device['minor'] = str(os.minor(device_num)) - devices.append(device) - for line in open('/proc/partitions').readlines()[2:]: - major, minor, blocks, kernel_device = line.strip().split() - device = [d for d in devices - if d['major'] == major and d['minor'] == minor] - if device: - device[0]['kernel_device'] = kernel_device - return devices - - -def get_errors(minutes): - errors = {} - start_time = datetime.datetime.now() - datetime.timedelta(minutes=minutes) - try: - for line in open('/var/log/kern.log'): - if '[ 0.000000]' in line: - # Ignore anything before the last boot - errors = {} - continue - log_time_string = '%s %s' % (start_time.year, - ' '.join(line.split()[:3])) - log_time = datetime.datetime.strptime( - log_time_string, '%Y %b %d %H:%M:%S') - if log_time > start_time: - for err in error_re: - for device in err.findall(line): - errors[device] = errors.get(device, 0) + 1 - return errors - except IOError: - logger.error("Error: Unable to open /var/log/kern.log") - print("Unable to open /var/log/kern.log") - sys.exit(1) - - -def comment_fstab(mount_point): - with open('/etc/fstab', 'r') as fstab: - with open('/etc/fstab.new', 'w') as new_fstab: - for line in fstab: - parts = line.split() - if len(parts) > 2 and line.split()[1] == mount_point: - new_fstab.write('#' + line) - else: - new_fstab.write(line) - os.rename('/etc/fstab.new', '/etc/fstab') - - -if __name__ == '__main__': - c = ConfigParser() - try: - conf_path = sys.argv[1] - except Exception: - print "Usage: %s CONF_FILE" % sys.argv[0].split('/')[-1] - sys.exit(1) - if not c.read(conf_path): - print "Unable to read config file %s" % conf_path - sys.exit(1) - conf = dict(c.items('drive-audit')) - device_dir = conf.get('device_dir', '/srv/node') - minutes = int(conf.get('minutes', 60)) - error_limit = int(conf.get('error_limit', 1)) - conf['log_name'] = conf.get('log_name', 'drive-audit') - logger = get_logger(conf, log_route='drive-audit') - devices = get_devices(device_dir, logger) - logger.debug("Devices found: %s" % str(devices)) - if not devices: - logger.error("Error: No devices found!") - errors = get_errors(minutes) - logger.debug("Errors found: %s" % str(errors)) - unmounts = 0 - for kernel_device, count in errors.items(): - if count >= error_limit: - device = \ - [d for d in devices if d['kernel_device'] == kernel_device] - if device: - mount_point = device[0]['mount_point'] - if mount_point.startswith(device_dir): - logger.info("Unmounting %s with %d errors" % - (mount_point, count)) - subprocess.call(['umount', '-fl', mount_point]) - logger.info("Commenting out %s from /etc/fstab" % - (mount_point)) - comment_fstab(mount_point) - unmounts += 1 - if unmounts == 0: - logger.info("No drives were unmounted") diff --git a/bin/swift-form-signature b/bin/swift-form-signature deleted file mode 100755 index 08a5adce53..0000000000 --- a/bin/swift-form-signature +++ /dev/null @@ -1,71 +0,0 @@ -#!/usr/bin/env python - -import hmac -from hashlib import sha1 -from os.path import basename -from sys import argv, exit -from time import time - - -if __name__ == '__main__': - if len(argv) != 7: - prog = basename(argv[0]) - print 'Syntax: %s ' \ - ' ' % prog - print - print 'Where:' - print ' The prefix to use for form uploaded' - print ' objects. For example:' - print ' /v1/account/container/object_prefix_ would' - print ' ensure all form uploads have that path' - print ' prepended to the browser-given file name.' 
- print ' The URL to redirect the browser to after' - print ' the uploads have completed.' - print ' The maximum file size per file uploaded.' - print ' The maximum number of uploaded files' - print ' allowed.' - print ' The number of seconds from now to allow' - print ' the form post to begin.' - print ' The X-Account-Meta-Temp-URL-Key for the' - print ' account.' - print - print 'Example output:' - print ' Expires: 1323842228' - print ' Signature: 18de97e47345a82c4dbfb3b06a640dbb' - exit(1) - path, redirect, max_file_size, max_file_count, seconds, key = argv[1:] - try: - max_file_size = int(max_file_size) - except ValueError: - max_file_size = -1 - if max_file_size < 0: - print 'Please use a value greater than or equal to 0.' - exit(1) - try: - max_file_count = int(max_file_count) - except ValueError: - max_file_count = 0 - if max_file_count < 1: - print 'Please use a positive value.' - exit(1) - try: - expires = int(time() + int(seconds)) - except ValueError: - expires = 0 - if expires < 1: - print 'Please use a positive value.' - exit(1) - parts = path.split('/', 4) - # Must be four parts, ['', 'v1', 'a', 'c'], must be a v1 request, have - # account and container values, and optionally have an object prefix. - if len(parts) < 4 or parts[0] or parts[1] != 'v1' or not parts[2] or \ - not parts[3]: - print ' must point to a container at least.' - print 'For example: /v1/account/container' - print ' Or: /v1/account/container/object_prefix' - exit(1) - sig = hmac.new(key, '%s\n%s\n%s\n%s\n%s' % (path, redirect, max_file_size, - max_file_count, expires), - sha1).hexdigest() - print ' Expires:', expires - print 'Signature:', sig diff --git a/bin/swift-get-nodes b/bin/swift-get-nodes deleted file mode 100755 index fcf45ae77b..0000000000 --- a/bin/swift-get-nodes +++ /dev/null @@ -1,132 +0,0 @@ -#!/usr/bin/env python -# Copyright (c) 2010-2012 OpenStack, LLC. -# -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. -# You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or -# implied. -# See the License for the specific language governing permissions and -# limitations under the License. - -import optparse -import sys -import urllib - -from swift.common.ring import Ring -from swift.common.utils import hash_path - - -parser = optparse.OptionParser() -parser.add_option('-a', '--all', action='store_true', - help='Show all handoff nodes') -parser.add_option('-p', '--partition', metavar='PARTITION', - help='Show nodes for a given partition') -(options, args) = parser.parse_args() - -if (len(args) < 2 or len(args) > 4) and \ - (options.partition is None or not args): - print 'Usage: %s [-a] [] []' \ - % sys.argv[0] - print ' Or: %s [-a] -p partition' % sys.argv[0] - print 'Shows the nodes responsible for the item specified.' 
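For reference, the bin/swift-form-signature script removed above derives its FormPost signature as an HMAC-SHA1 over the newline-joined path, redirect, max_file_size, max_file_count and expires values. A minimal Python 3 sketch of that same calculation follows; the path, key and limits are illustrative placeholders, not values taken from this patch.

    import hmac
    from hashlib import sha1
    from time import time

    # Illustrative inputs -- in practice these describe the form being signed.
    path = '/v1/AUTH_test/container/object_prefix_'
    redirect = ''
    max_file_size = 104857600
    max_file_count = 10
    expires = int(time() + 600)
    key = 'mykey'  # the account's X-Account-Meta-Temp-URL-Key

    # Same newline-joined payload the removed script passes to hmac.new()
    hmac_body = '%s\n%s\n%s\n%s\n%s' % (path, redirect, max_file_size,
                                        max_file_count, expires)
    signature = hmac.new(key.encode('utf-8'), hmac_body.encode('utf-8'),
                         sha1).hexdigest()
    print('Expires:', expires)
    print('Signature:', signature)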
- print 'Example:' - print ' $ %s /etc/swift/account.ring.gz MyAccount' % sys.argv[0] - print ' Partition 5743883' - print ' Hash 96ae332a60b58910784e4417a03e1ad0' - print ' 10.1.1.7:8000 sdd1' - print ' 10.1.9.2:8000 sdb1' - print ' 10.1.5.5:8000 sdf1' - print ' 10.1.5.9:8000 sdt1 # [Handoff]' - sys.exit(1) - -ringloc = None -account = None -container = None -obj = None - -if len(args) == 4: - # Account, Container and Object - ring_file, account, container, obj = args - ring = Ring(ring_file) - hash_str = hash_path(account, container, obj) - part, nodes = ring.get_nodes(account, container, obj) - target = "%s/%s/%s" % (account, container, obj) - loc = 'objects' -elif len(args) == 3: - # Account, Container - ring_file, account, container = args - ring = Ring(ring_file) - hash_str = hash_path(account, container) - part, nodes = ring.get_nodes(account, container) - target = "%s/%s" % (account, container) - loc = 'containers' -elif len(args) == 2: - # Account - ring_file, account = args - ring = Ring(ring_file) - hash_str = hash_path(account) - part, nodes = ring.get_nodes(account) - target = "%s" % (account) - loc = 'accounts' -elif len(args) == 1: - # Partition - ring_file = args[0] - ring = Ring(ring_file) - hash_str = None - part = int(options.partition) - nodes = ring.get_part_nodes(part) - target = '' - loc = ring_file.rsplit('/', 1)[-1].split('.', 1)[0] - if loc in ('account', 'container', 'object'): - loc += 's' - else: - loc = '' - -more_nodes = [] -for more_node in ring.get_more_nodes(part): - more_nodes.append(more_node) - if not options.all and len(more_nodes) >= ring.replica_count: - break - -print '\nAccount \t%s' % account -print 'Container\t%s' % container -print 'Object \t%s\n' % obj -print '\nPartition\t%s' % part -print 'Hash \t%s\n' % hash_str - -for node in nodes: - print 'Server:Port Device\t%s:%s %s' % (node['ip'], node['port'], - node['device']) -for mnode in more_nodes: - print 'Server:Port Device\t%s:%s %s\t [Handoff]' \ - % (mnode['ip'], mnode['port'], mnode['device']) -print "\n" -for node in nodes: - print 'curl -I -XHEAD "http://%s:%s/%s/%s/%s"' \ - % (node['ip'], node['port'], node['device'], part, - urllib.quote(target)) -for mnode in more_nodes: - print 'curl -I -XHEAD "http://%s:%s/%s/%s/%s" # [Handoff]' \ - % (mnode['ip'], mnode['port'], mnode['device'], part, - urllib.quote(target)) -print "\n" -for node in nodes: - if hash_str: - print 'ssh %s "ls -lah /srv/node/%s/%s/%s/%s/%s/"' % ( - node['ip'], node['device'], loc, part, hash_str[-3:], hash_str) - else: - print 'ssh %s "ls -lah /srv/node/%s/%s/%s/"' % ( - node['ip'], node['device'], loc, part) -for mnode in more_nodes: - if hash_str: - print 'ssh %s "ls -lah /srv/node/%s/%s/%s/%s/%s/" # [Handoff]' % ( - mnode['ip'], mnode['device'], loc, part, hash_str[-3:], hash_str) - else: - print 'ssh %s "ls -lah /srv/node/%s/%s/%s/" # [Handoff]' % ( - mnode['ip'], mnode['device'], loc, part) diff --git a/bin/swift-init b/bin/swift-init deleted file mode 100755 index 17dcbd0be1..0000000000 --- a/bin/swift-init +++ /dev/null @@ -1,73 +0,0 @@ -#!/usr/bin/env python -# Copyright (c) 2010-2012 OpenStack, LLC. -# -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. 
-# You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or -# implied. -# See the License for the specific language governing permissions and -# limitations under the License. - -import sys -from optparse import OptionParser - -from swift.common.manager import Server, Manager, UnknownCommandError - -USAGE = """%prog [ ...] [options] - -Commands: -""" + '\n'.join(["%16s: %s" % x for x in Manager.list_commands()]) - - -def main(): - parser = OptionParser(USAGE) - parser.add_option('-v', '--verbose', action="store_true", - default=False, help="display verbose output") - parser.add_option('-w', '--no-wait', action="store_false", dest="wait", - default=True, help="won't wait for server to start " - "before returning") - parser.add_option('-o', '--once', action="store_true", - default=False, help="only run one pass of daemon") - # this is a negative option, default is options.daemon = True - parser.add_option('-n', '--no-daemon', action="store_false", dest="daemon", - default=True, help="start server interactively") - parser.add_option('-g', '--graceful', action="store_true", - default=False, help="send SIGHUP to supporting servers") - parser.add_option('-c', '--config-num', metavar="N", type="int", - dest="number", default=0, - help="send command to the Nth server only") - options, args = parser.parse_args() - - if len(args) < 2: - parser.print_help() - print 'ERROR: specify server(s) and command' - return 1 - - command = args[-1] - servers = args[:-1] - - # this is just a silly swap for me cause I always try to "start main" - commands = dict(Manager.list_commands()).keys() - if command not in commands and servers[0] in commands: - servers.append(command) - command = servers.pop(0) - - manager = Manager(servers) - try: - status = manager.run_command(command, **options.__dict__) - except UnknownCommandError: - parser.print_help() - print 'ERROR: unknown command, %s' % command - status = 1 - - return 1 if status else 0 - - -if __name__ == "__main__": - sys.exit(main()) diff --git a/bin/swift-object-auditor b/bin/swift-object-auditor deleted file mode 100755 index 2a2d38bfcd..0000000000 --- a/bin/swift-object-auditor +++ /dev/null @@ -1,27 +0,0 @@ -#!/usr/bin/env python -# Copyright (c) 2010-2012 OpenStack, LLC. -# -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. -# You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or -# implied. -# See the License for the specific language governing permissions and -# limitations under the License. 
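The bin/swift-init wrapper deleted above is a thin shell around swift.common.manager.Manager, with the CLI flags passed straight through as keyword arguments to run_command(). Below is a rough sketch of the programmatic equivalent of `swift-init object-auditor start`, assuming Manager keeps the interface used by the removed script; the server name and flag values are illustrative.

    # Sketch only: mirrors manager.run_command(command, **options.__dict__)
    # from the removed bin/swift-init. Kwargs correspond to -o/-w/-n/-g/-c/-v.
    from swift.common.manager import Manager

    manager = Manager(['object-auditor'])
    status = manager.run_command('start', once=False, wait=True, daemon=True,
                                 graceful=False, number=0, verbose=False)
    raise SystemExit(1 if status else 0)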
- -from swift.obj.auditor import ObjectAuditor -from swift.common.utils import parse_options -from swift.common.daemon import run_daemon -from optparse import OptionParser - -if __name__ == '__main__': - parser = OptionParser("%prog CONFIG [options]") - parser.add_option('-z', '--zero_byte_fps', - help='Audit only zero byte files at specified files/sec') - conf_file, options = parse_options(parser=parser, once=True) - run_daemon(ObjectAuditor, conf_file, **options) diff --git a/bin/swift-object-info b/bin/swift-object-info deleted file mode 100755 index bf612cc5b7..0000000000 --- a/bin/swift-object-info +++ /dev/null @@ -1,92 +0,0 @@ -#!/usr/bin/env python -# Copyright (c) 2010-2012 OpenStack, LLC. -# -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. -# You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or -# implied. -# See the License for the specific language governing permissions and -# limitations under the License. - -import sys -import cPickle as pickle -from datetime import datetime -from hashlib import md5 - -from swift.common.ring import Ring -from swift.obj.server import read_metadata -from swift.common.utils import hash_path - -if __name__ == '__main__': - if len(sys.argv) <= 1: - print "Usage: %s OBJECT_FILE" % sys.argv[0] - sys.exit(1) - try: - ring = Ring('/etc/swift/', ring_name='object') - except Exception: - ring = None - datafile = sys.argv[1] - fp = open(datafile, 'rb') - metadata = read_metadata(fp) - path = metadata.pop('name', '') - content_type = metadata.pop('Content-Type', '') - ts = metadata.pop('X-Timestamp', '') - etag = metadata.pop('ETag', '') - length = metadata.pop('Content-Length', '') - if path: - print 'Path: %s' % path - account, container, obj = path.split('/', 3)[1:] - print ' Account: %s' % account - print ' Container: %s' % container - print ' Object: %s' % obj - obj_hash = hash_path(account, container, obj) - print ' Object hash: %s' % obj_hash - if ring is not None: - print 'Ring locations:' - part, nodes = ring.get_nodes(account, container, obj) - for node in nodes: - print (' %s:%s - /srv/node/%s/objects/%s/%s/%s/%s.data' % - (node['ip'], node['port'], node['device'], part, - obj_hash[-3:], obj_hash, ts)) - else: - print 'Path: Not found in metadata' - if content_type: - print 'Content-Type: %s' % content_type - else: - print 'Content-Type: Not found in metadata' - if ts: - print 'Timestamp: %s (%s)' % (datetime.fromtimestamp(float(ts)), ts) - else: - print 'Timestamp: Not found in metadata' - h = md5() - file_len = 0 - while True: - data = fp.read(64 * 1024) - if not data: - break - h.update(data) - file_len += len(data) - h = h.hexdigest() - if etag: - if h == etag: - print 'ETag: %s (valid)' % etag - else: - print "Etag: %s doesn't match file hash of %s!" 
% (etag, h) - else: - print 'ETag: Not found in metadata' - if length: - if file_len == int(length): - print 'Content-Length: %s (valid)' % length - else: - print "Content-Length: %s doesn't match file length of %s" % ( - length, file_len) - else: - print 'Content-Length: Not found in metadata' - print 'User Metadata: %s' % metadata - fp.close() diff --git a/bin/swift-object-replicator b/bin/swift-object-replicator deleted file mode 100755 index 2f01a209a3..0000000000 --- a/bin/swift-object-replicator +++ /dev/null @@ -1,31 +0,0 @@ -#!/usr/bin/env python -# Copyright (c) 2010-2012 OpenStack, LLC. -# -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. -# You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or -# implied. -# See the License for the specific language governing permissions and -# limitations under the License. - -from swift.obj.replicator import ObjectReplicator -from swift.common.utils import parse_options -from swift.common.daemon import run_daemon -from optparse import OptionParser - -if __name__ == '__main__': - parser = OptionParser("%prog CONFIG [options]") - parser.add_option('-d', '--devices', - help='Replicate only given devices. ' - 'Comma-separated list') - parser.add_option('-p', '--partitions', - help='Replicate only given partitions. ' - 'Comma-separated list') - conf_file, options = parse_options(parser=parser, once=True) - run_daemon(ObjectReplicator, conf_file, **options) diff --git a/bin/swift-object-updater b/bin/swift-object-updater deleted file mode 100755 index c7f04c965d..0000000000 --- a/bin/swift-object-updater +++ /dev/null @@ -1,23 +0,0 @@ -#!/usr/bin/env python -# Copyright (c) 2010-2012 OpenStack, LLC. -# -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. -# You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or -# implied. -# See the License for the specific language governing permissions and -# limitations under the License. - -from swift.obj.updater import ObjectUpdater -from swift.common.utils import parse_options -from swift.common.daemon import run_daemon - -if __name__ == '__main__': - conf_file, options = parse_options(once=True) - run_daemon(ObjectUpdater, conf_file, **options) diff --git a/bin/swift-oldies b/bin/swift-oldies deleted file mode 100755 index 15f34e5281..0000000000 --- a/bin/swift-oldies +++ /dev/null @@ -1,67 +0,0 @@ -#!/usr/bin/env python - -import optparse -import os -import signal -import subprocess -import sys - - -if __name__ == '__main__': - parser = optparse.OptionParser(usage='''%prog [options] - -Lists old Swift processes. 
- '''.strip()) - parser.add_option('-a', '--age', dest='hours', type='int', default=720, - help='look for processes at least HOURS old; ' - 'default: 720 (30 days)') - (options, args) = parser.parse_args() - - listing = [] - for line in subprocess.Popen( - ['ps', '-eo', 'etime,pid,args', '--no-headers'], - stdout=subprocess.PIPE).communicate()[0].split('\n'): - if not line: - continue - hours = 0 - try: - etime, pid, args = line.split(None, 2) - except ValueError: - sys.exit('Could not process ps line %r' % line) - if not args.startswith('/usr/bin/python /usr/bin/swift-') and \ - not args.startswith('/usr/bin/python /usr/local/bin/swift-'): - continue - args = args.split('-', 1)[1] - etime = etime.split('-') - if len(etime) == 2: - hours = int(etime[0]) * 24 - etime = etime[1] - elif len(etime) == 1: - etime = etime[0] - else: - sys.exit('Could not process etime value from %r' % line) - etime = etime.split(':') - if len(etime) == 3: - hours += int(etime[0]) - elif len(etime) != 2: - sys.exit('Could not process etime value from %r' % line) - if hours >= options.hours: - listing.append((str(hours), pid, args)) - - if not listing: - exit() - - hours_len = len('Hours') - pid_len = len('PID') - args_len = len('Command') - for hours, pid, args in listing: - hours_len = max(hours_len, len(hours)) - pid_len = max(pid_len, len(pid)) - args_len = max(args_len, len(args)) - args_len = min(args_len, 78 - hours_len - pid_len) - - print ('%%%ds %%%ds %%s' % (hours_len, pid_len)) % \ - ('Hours', 'PID', 'Command') - for hours, pid, args in listing: - print ('%%%ds %%%ds %%s' % (hours_len, pid_len)) % \ - (hours, pid, args[:args_len]) diff --git a/bin/swift-recon b/bin/swift-recon deleted file mode 100755 index b72cc2841d..0000000000 --- a/bin/swift-recon +++ /dev/null @@ -1,765 +0,0 @@ -#! /usr/bin/env python -""" - cmdline utility to perform cluster reconnaissance -""" - - -from eventlet.green import urllib2 -from swift.common.ring import Ring -from urlparse import urlparse -try: - import simplejson as json -except ImportError: - import json -from hashlib import md5 -import eventlet -import optparse -import time -import sys -import os - - -class Scout(object): - """ - Obtain swift recon information - """ - - def __init__(self, recon_type, verbose=False, suppress_errors=False, - timeout=5): - self.recon_type = recon_type - self.verbose = verbose - self.suppress_errors = suppress_errors - self.timeout = timeout - - def scout_host(self, base_url, recon_type): - """ - Perform the actual HTTP request to obtain swift recon telemtry. - - :param base_url: the base url of the host you wish to check. str of the - format 'http://127.0.0.1:6000/recon/' - :param recon_type: the swift recon check to request. - :returns: tuple of (recon url used, response body, and status) - """ - url = base_url + recon_type - try: - body = urllib2.urlopen(url, timeout=self.timeout).read() - content = json.loads(body) - if self.verbose: - print "-> %s: %s" % (url, content) - status = 200 - except urllib2.HTTPError as err: - if not self.suppress_errors or self.verbose: - print "-> %s: %s" % (url, err) - content = err - status = err.code - except urllib2.URLError as err: - if not self.suppress_errors or self.verbose: - print "-> %s: %s" % (url, err) - content = err - status = -1 - return url, content, status - - def scout(self, host): - """ - Obtain telemetry from a host running the swift recon middleware. 
- - :param host: host to check - :returns: tuple of (recon url used, response body, and status) - """ - base_url = "http://%s:%s/recon/" % (host[0], host[1]) - url, content, status = self.scout_host(base_url, self.recon_type) - return url, content, status - - -class SwiftRecon(object): - """ - Retrieve and report cluster info from hosts running recon middleware. - """ - - def __init__(self): - self.verbose = False - self.suppress_errors = False - self.timeout = 5 - self.pool_size = 30 - self.pool = eventlet.GreenPool(self.pool_size) - self.check_types = ['account', 'container', 'object'] - self.server_type = 'object' - - def _gen_stats(self, stats, name=None): - """ compute various stats from a list of values """ - cstats = [x for x in stats if x is not None] - if len(cstats) > 0: - ret_dict = {'low': min(cstats), 'high': max(cstats), - 'total': sum(cstats), 'reported': len(cstats), - 'number_none': len(stats) - len(cstats), 'name': name} - ret_dict['average'] = \ - ret_dict['total'] / float(len(cstats)) - ret_dict['perc_none'] = \ - ret_dict['number_none'] * 100.0 / len(stats) - else: - ret_dict = {'reported': 0} - return ret_dict - - def _print_stats(self, stats): - """ - print out formatted stats to console - - :param stats: dict of stats generated by _gen_stats - """ - print '[%(name)s] low: %(low)d, high: %(high)d, avg: ' \ - '%(average).1f, total: %(total)d, ' \ - 'Failed: %(perc_none).1f%%, no_result: %(number_none)d, ' \ - 'reported: %(reported)d' % stats - - def _ptime(self, timev=None): - """ - :param timev: a unix timestamp or None - :returns: a pretty string of the current time or provided time - """ - if timev: - return time.strftime("%Y-%m-%d %H:%M:%S", time.localtime(timev)) - else: - return time.strftime("%Y-%m-%d %H:%M:%S", time.localtime()) - - def get_devices(self, zone_filter, swift_dir, ring_name): - """ - Get a list of hosts in the ring - - :param zone_filter: Only list zones matching given filter - :param swift_dir: Directory of swift config, usually /etc/swift - :param ring_name: Name of the ring, such as 'object' - :returns: a set of tuples containing the ip and port of hosts - """ - ring_data = Ring(swift_dir, ring_name=ring_name) - if zone_filter: - ips = set((n['ip'], n['port']) for n in ring_data.devs - if n and n['zone'] == zone_filter) - else: - ips = set((n['ip'], n['port']) for n in ring_data.devs if n) - return ips - - def get_ringmd5(self, hosts, ringfile): - """ - Compare ring md5sum's with those on remote host - - :param hosts: set of hosts to check. in the format of: - set([('127.0.0.1', 6020), ('127.0.0.2', 6030)]) - :param ringfile: The local ring file to compare the md5sum with. - """ - stats = {} - matches = 0 - errors = 0 - md5sum = md5() - with open(ringfile, 'rb') as f: - block = f.read(4096) - while block: - md5sum.update(block) - block = f.read(4096) - ring_sum = md5sum.hexdigest() - recon = Scout("ringmd5", self.verbose, self.suppress_errors, - self.timeout) - print "[%s] Checking ring md5sums" % self._ptime() - if self.verbose: - print "-> On disk %s md5sum: %s" % (ringfile, ring_sum) - for url, response, status in self.pool.imap(recon.scout, hosts): - if status == 200: - stats[url] = response[ringfile] - if response[ringfile] != ring_sum: - print "!! %s (%s) doesn't match on disk md5sum" % \ - (url, response[ringfile]) - else: - matches = matches + 1 - if self.verbose: - print "-> %s matches." % url - else: - errors = errors + 1 - print "%s/%s hosts matched, %s error[s] while checking hosts." 
\ - % (matches, len(hosts), errors) - print "=" * 79 - - def async_check(self, hosts): - """ - Obtain and print async pending statistics - - :param hosts: set of hosts to check. in the format of: - set([('127.0.0.1', 6020), ('127.0.0.2', 6030)]) - """ - scan = {} - recon = Scout("async", self.verbose, self.suppress_errors, - self.timeout) - print "[%s] Checking async pendings" % self._ptime() - for url, response, status in self.pool.imap(recon.scout, hosts): - if status == 200: - scan[url] = response['async_pending'] - stats = self._gen_stats(scan.values(), 'async_pending') - if stats['reported'] > 0: - self._print_stats(stats) - else: - print "[async_pending] - No hosts returned valid data." - print "=" * 79 - - def umount_check(self, hosts): - """ - Check for and print unmounted drives - - :param hosts: set of hosts to check. in the format of: - set([('127.0.0.1', 6020), ('127.0.0.2', 6030)]) - """ - stats = {} - recon = Scout("unmounted", self.verbose, self.suppress_errors, - self.timeout) - print "[%s] Getting unmounted drives from %s hosts..." % \ - (self._ptime(), len(hosts)) - for url, response, status in self.pool.imap(recon.scout, hosts): - if status == 200: - stats[url] = [] - for i in response: - stats[url].append(i['device']) - for host in stats: - node = urlparse(host).netloc - for entry in stats[host]: - print "Not mounted: %s on %s" % (entry, node) - print "=" * 79 - - def expirer_check(self, hosts): - """ - Obtain and print expirer statistics - - :param hosts: set of hosts to check. in the format of: - set([('127.0.0.1', 6020), ('127.0.0.2', 6030)]) - """ - stats = {'object_expiration_pass': [], 'expired_last_pass': []} - recon = Scout("expirer/%s" % self.server_type, self.verbose, - self.suppress_errors, self.timeout) - print "[%s] Checking on expirers" % self._ptime() - for url, response, status in self.pool.imap(recon.scout, hosts): - if status == 200: - stats['object_expiration_pass'].append( - response.get('object_expiration_pass')) - stats['expired_last_pass'].append( - response.get('expired_last_pass')) - for k in stats: - if stats[k]: - computed = self._gen_stats(stats[k], name=k) - if computed['reported'] > 0: - self._print_stats(computed) - else: - print "[%s] - No hosts returned valid data." % k - else: - print "[%s] - No hosts returned valid data." % k - print "=" * 79 - - def replication_check(self, hosts): - """ - Obtain and print replication statistics - - :param hosts: set of hosts to check. in the format of: - set([('127.0.0.1', 6020), ('127.0.0.2', 6030)]) - """ - stats = {'replication_time': [], 'failure': [], 'success': [], - 'attempted': []} - recon = Scout("replication/%s" % self.server_type, self.verbose, - self.suppress_errors, self.timeout) - print "[%s] Checking on replication" % self._ptime() - for url, response, status in self.pool.imap(recon.scout, hosts): - if status == 200: - stats['replication_time'].append( - response.get('replication_time')) - repl_stats = response['replication_stats'] - if repl_stats: - for stat_key in ['attempted', 'failure', 'success']: - stats[stat_key].append(repl_stats.get(stat_key)) - for k in stats: - if stats[k]: - if k != 'replication_time': - computed = self._gen_stats(stats[k], - name='replication_%s' % k) - else: - computed = self._gen_stats(stats[k], name=k) - if computed['reported'] > 0: - self._print_stats(computed) - else: - print "[%s] - No hosts returned valid data." % k - else: - print "[%s] - No hosts returned valid data." 
% k - print "=" * 79 - - def object_replication_check(self, hosts): - """ - Obtain and print replication statistics from object servers - - :param hosts: set of hosts to check. in the format of: - set([('127.0.0.1', 6020), ('127.0.0.2', 6030)]) - """ - stats = {} - recon = Scout("replication", self.verbose, self.suppress_errors, - self.timeout) - print "[%s] Checking on replication" % self._ptime() - for url, response, status in self.pool.imap(recon.scout, hosts): - if status == 200: - stats[url] = response['object_replication_time'] - times = [x for x in stats.values() if x is not None] - if len(stats) > 0 and len(times) > 0: - computed = self._gen_stats(times, 'replication_time') - if computed['reported'] > 0: - self._print_stats(computed) - else: - print "[replication_time] - No hosts returned valid data." - else: - print "[replication_time] - No hosts returned valid data." - print "=" * 79 - - def updater_check(self, hosts): - """ - Obtain and print updater statistics - - :param hosts: set of hosts to check. in the format of: - set([('127.0.0.1', 6020), ('127.0.0.2', 6030)]) - """ - stats = [] - recon = Scout("updater/%s" % self.server_type, self.verbose, - self.suppress_errors, self.timeout) - print "[%s] Checking updater times" % self._ptime() - for url, response, status in self.pool.imap(recon.scout, hosts): - if status == 200: - if response['%s_updater_sweep' % self.server_type]: - stats.append(response['%s_updater_sweep' % - self.server_type]) - if len(stats) > 0: - computed = self._gen_stats(stats, name='updater_last_sweep') - if computed['reported'] > 0: - self._print_stats(computed) - else: - print "[updater_last_sweep] - No hosts returned valid data." - else: - print "[updater_last_sweep] - No hosts returned valid data." - print "=" * 79 - - def auditor_check(self, hosts): - """ - Obtain and print obj auditor statistics - - :param hosts: set of hosts to check. in the format of: - set([('127.0.0.1', 6020), ('127.0.0.2', 6030)]) - """ - scan = {} - adone = '%s_auditor_pass_completed' % self.server_type - afail = '%s_audits_failed' % self.server_type - apass = '%s_audits_passed' % self.server_type - asince = '%s_audits_since' % self.server_type - recon = Scout("auditor/%s" % self.server_type, self.verbose, - self.suppress_errors, self.timeout) - print "[%s] Checking auditor stats" % self._ptime() - for url, response, status in self.pool.imap(recon.scout, hosts): - if status == 200: - scan[url] = response - if len(scan) < 1: - print "Error: No hosts available" - return - stats = {} - stats[adone] = [scan[i][adone] for i in scan - if scan[i][adone] is not None] - stats[afail] = [scan[i][afail] for i in scan - if scan[i][afail] is not None] - stats[apass] = [scan[i][apass] for i in scan - if scan[i][apass] is not None] - stats[asince] = [scan[i][asince] for i in scan - if scan[i][asince] is not None] - for k in stats: - if len(stats[k]) < 1: - print "[%s] - No hosts returned valid data." % k - else: - if k != asince: - computed = self._gen_stats(stats[k], k) - if computed['reported'] > 0: - self._print_stats(computed) - if len(stats[asince]) >= 1: - low = min(stats[asince]) - high = max(stats[asince]) - total = sum(stats[asince]) - average = total / len(stats[asince]) - print '[last_pass] oldest: %s, newest: %s, avg: %s' % \ - (self._ptime(low), self._ptime(high), self._ptime(average)) - print "=" * 79 - - def object_auditor_check(self, hosts): - """ - Obtain and print obj auditor statistics - - :param hosts: set of hosts to check. 
in the format of: - set([('127.0.0.1', 6020), ('127.0.0.2', 6030)]) - """ - all_scan = {} - zbf_scan = {} - atime = 'audit_time' - bprocessed = 'bytes_processed' - passes = 'passes' - errors = 'errors' - quarantined = 'quarantined' - recon = Scout("auditor/object", self.verbose, self.suppress_errors, - self.timeout) - print "[%s] Checking auditor stats " % self._ptime() - for url, response, status in self.pool.imap(recon.scout, hosts): - if status == 200: - if response['object_auditor_stats_ALL']: - all_scan[url] = response['object_auditor_stats_ALL'] - if response['object_auditor_stats_ZBF']: - zbf_scan[url] = response['object_auditor_stats_ZBF'] - if len(all_scan) > 0: - stats = {} - stats[atime] = [all_scan[i][atime] for i in all_scan] - stats[bprocessed] = [all_scan[i][bprocessed] for i in all_scan] - stats[passes] = [all_scan[i][passes] for i in all_scan] - stats[errors] = [all_scan[i][errors] for i in all_scan] - stats[quarantined] = [all_scan[i][quarantined] for i in all_scan] - for k in stats: - if None in stats[k]: - stats[k] = [x for x in stats[k] if x is not None] - if len(stats[k]) < 1: - print "[Auditor %s] - No hosts returned valid data." % k - else: - computed = self._gen_stats(stats[k], - name='ALL_%s_last_path' % k) - if computed['reported'] > 0: - self._print_stats(computed) - else: - print "[ALL_auditor] - No hosts returned valid data." - else: - print "[ALL_auditor] - No hosts returned valid data." - if len(zbf_scan) > 0: - stats = {} - stats[atime] = [zbf_scan[i][atime] for i in zbf_scan] - stats[bprocessed] = [zbf_scan[i][bprocessed] for i in zbf_scan] - stats[errors] = [zbf_scan[i][errors] for i in zbf_scan] - stats[quarantined] = [zbf_scan[i][quarantined] for i in zbf_scan] - for k in stats: - if None in stats[k]: - stats[k] = [x for x in stats[k] if x is not None] - if len(stats[k]) < 1: - print "[Auditor %s] - No hosts returned valid data." % k - else: - computed = self._gen_stats(stats[k], - name='ZBF_%s_last_path' % k) - if computed['reported'] > 0: - self._print_stats(computed) - else: - print "[ZBF_auditor] - No hosts returned valid data." - else: - print "[ZBF_auditor] - No hosts returned valid data." - print "=" * 79 - - def load_check(self, hosts): - """ - Obtain and print load average statistics - - :param hosts: set of hosts to check. in the format of: - set([('127.0.0.1', 6020), ('127.0.0.2', 6030)]) - """ - load1 = {} - load5 = {} - load15 = {} - recon = Scout("load", self.verbose, self.suppress_errors, - self.timeout) - print "[%s] Checking load averages" % self._ptime() - for url, response, status in self.pool.imap(recon.scout, hosts): - if status == 200: - load1[url] = response['1m'] - load5[url] = response['5m'] - load15[url] = response['15m'] - stats = {"1m": load1, "5m": load5, "15m": load15} - for item in stats: - if len(stats[item]) > 0: - computed = self._gen_stats(stats[item].values(), - name='%s_load_avg' % item) - self._print_stats(computed) - else: - print "[%s_load_avg] - No hosts returned valid data." % item - print "=" * 79 - - def quarantine_check(self, hosts): - """ - Obtain and print quarantine statistics - - :param hosts: set of hosts to check. 
in the format of: - set([('127.0.0.1', 6020), ('127.0.0.2', 6030)]) - """ - objq = {} - conq = {} - acctq = {} - recon = Scout("quarantined", self.verbose, self.suppress_errors, - self.timeout) - print "[%s] Checking quarantine" % self._ptime() - for url, response, status in self.pool.imap(recon.scout, hosts): - if status == 200: - objq[url] = response['objects'] - conq[url] = response['containers'] - acctq[url] = response['accounts'] - stats = {"objects": objq, "containers": conq, "accounts": acctq} - for item in stats: - if len(stats[item]) > 0: - computed = self._gen_stats(stats[item].values(), - name='quarantined_%s' % item) - self._print_stats(computed) - else: - print "No hosts returned valid data." - print "=" * 79 - - def socket_usage(self, hosts): - """ - Obtain and print /proc/net/sockstat statistics - - :param hosts: set of hosts to check. in the format of: - set([('127.0.0.1', 6020), ('127.0.0.2', 6030)]) - """ - inuse4 = {} - mem = {} - inuse6 = {} - timewait = {} - orphan = {} - recon = Scout("sockstat", self.verbose, self.suppress_errors, - self.timeout) - print "[%s] Checking socket usage" % self._ptime() - for url, response, status in self.pool.imap(recon.scout, hosts): - if status == 200: - inuse4[url] = response['tcp_in_use'] - mem[url] = response['tcp_mem_allocated_bytes'] - inuse6[url] = response['tcp6_in_use'] - timewait[url] = response['time_wait'] - orphan[url] = response['orphan'] - stats = {"tcp_in_use": inuse4, "tcp_mem_allocated_bytes": mem, - "tcp6_in_use": inuse6, "time_wait": timewait, - "orphan": orphan} - for item in stats: - if len(stats[item]) > 0: - computed = self._gen_stats(stats[item].values(), item) - self._print_stats(computed) - else: - print "No hosts returned valid data." - print "=" * 79 - - def disk_usage(self, hosts, top=0): - """ - Obtain and print disk usage statistics - - :param hosts: set of hosts to check. in the format of: - set([('127.0.0.1', 6020), ('127.0.0.2', 6030)]) - """ - stats = {} - highs = [] - lows = [] - raw_total_used = [] - raw_total_avail = [] - percents = {} - top_percents = [(None, 0)] * top - recon = Scout("diskusage", self.verbose, self.suppress_errors, - self.timeout) - print "[%s] Checking disk usage now" % self._ptime() - for url, response, status in self.pool.imap(recon.scout, hosts): - if status == 200: - hostusage = [] - for entry in response: - if entry['mounted']: - used = float(entry['used']) / float(entry['size']) \ - * 100.0 - raw_total_used.append(entry['used']) - raw_total_avail.append(entry['avail']) - hostusage.append(round(used, 2)) - for ident, oused in top_percents: - if oused < used: - top_percents.append( - (url + ' ' + entry['device'], used)) - top_percents.sort(key=lambda x: -x[1]) - top_percents.pop() - break - stats[url] = hostusage - - for url in stats: - if len(stats[url]) > 0: - #get per host hi/los for another day - low = min(stats[url]) - high = max(stats[url]) - highs.append(high) - lows.append(low) - for percent in stats[url]: - percents[int(percent)] = percents.get(int(percent), 0) + 1 - else: - print "-> %s: Error. No drive info available." 
% url - - if len(lows) > 0: - low = min(lows) - high = max(highs) - #dist graph shamelessly stolen from https://github.com/gholt/tcod - print "Distribution Graph:" - mul = 69.0 / max(percents.values()) - for percent in sorted(percents): - print '% 3d%%%5d %s' % (percent, percents[percent], - '*' * int(percents[percent] * mul)) - raw_used = sum(raw_total_used) - raw_avail = sum(raw_total_avail) - raw_total = raw_used + raw_avail - avg_used = 100.0 * raw_used / raw_total - print "Disk usage: space used: %s of %s" % (raw_used, raw_total) - print "Disk usage: space free: %s of %s" % (raw_avail, raw_total) - print "Disk usage: lowest: %s%%, highest: %s%%, avg: %s%%" % \ - (low, high, avg_used) - else: - print "No hosts returned valid data." - print "=" * 79 - if top_percents: - print 'TOP %s' % top - for ident, used in top_percents: - if ident: - url, device = ident.split() - host = urlparse(url).netloc.split(':')[0] - print '%.02f%% %s' % (used, '%-15s %s' % (host, device)) - - def main(self): - """ - Retrieve and report cluster info from hosts running recon middleware. - """ - print "=" * 79 - usage = ''' - usage: %prog [-v] [--suppress] [-a] [-r] [-u] [-d] - [-l] [--md5] [--auditor] [--updater] [--expirer] [--sockstat] - - \taccount|container|object - Defaults to object server. - - ex: %prog container -l --auditor - ''' - args = optparse.OptionParser(usage) - args.add_option('--verbose', '-v', action="store_true", - help="Print verbose info") - args.add_option('--suppress', action="store_true", - help="Suppress most connection related errors") - args.add_option('--async', '-a', action="store_true", - help="Get async stats") - args.add_option('--replication', '-r', action="store_true", - help="Get replication stats") - args.add_option('--auditor', action="store_true", - help="Get auditor stats") - args.add_option('--updater', action="store_true", - help="Get updater stats") - args.add_option('--expirer', action="store_true", - help="Get expirer stats") - args.add_option('--unmounted', '-u', action="store_true", - help="Check cluster for unmounted devices") - args.add_option('--diskusage', '-d', action="store_true", - help="Get disk usage stats") - args.add_option('--loadstats', '-l', action="store_true", - help="Get cluster load average stats") - args.add_option('--quarantined', '-q', action="store_true", - help="Get cluster quarantine stats") - args.add_option('--md5', action="store_true", - help="Get md5sum of servers ring and compare to " - "local copy") - args.add_option('--sockstat', action="store_true", - help="Get cluster socket usage stats") - args.add_option('--top', type='int', metavar='COUNT', default=0, - help='Also show the top COUNT entries in rank order.') - args.add_option('--all', action="store_true", - help="Perform all checks. 
Equal to -arudlq --md5 " - "--sockstat") - args.add_option('--zone', '-z', type="int", - help="Only query servers in specified zone") - args.add_option('--timeout', '-t', type="int", metavar="SECONDS", - help="Time to wait for a response from a server", - default=5) - args.add_option('--swiftdir', default="/etc/swift", - help="Default = /etc/swift") - options, arguments = args.parse_args() - - if len(sys.argv) <= 1 or len(arguments) > 1: - args.print_help() - sys.exit(0) - - if arguments: - if arguments[0] in self.check_types: - self.server_type = arguments[0] - else: - print "Invalid Server Type" - args.print_help() - sys.exit(1) - else: - self.server_type = 'object' - - swift_dir = options.swiftdir - ring_file = os.path.join(swift_dir, '%s.ring.gz' % self.server_type) - self.verbose = options.verbose - self.suppress_errors = options.suppress - self.timeout = options.timeout - - if options.zone: - hosts = self.get_devices(options.zone, swift_dir, self.server_type) - else: - hosts = self.get_devices(None, swift_dir, self.server_type) - - print "--> Starting reconnaissance on %s hosts" % len(hosts) - print "=" * 79 - - if options.all: - if self.server_type == 'object': - self.async_check(hosts) - self.object_replication_check(hosts) - self.object_auditor_check(hosts) - self.updater_check(hosts) - self.expirer_check(hosts) - elif self.server_type == 'container': - self.replication_check(hosts) - self.auditor_check(hosts) - self.updater_check(hosts) - elif self.server_type == 'account': - self.replication_check(hosts) - self.auditor_check(hosts) - self.umount_check(hosts) - self.load_check(hosts) - self.disk_usage(hosts) - self.get_ringmd5(hosts, ring_file) - self.quarantine_check(hosts) - self.socket_usage(hosts) - else: - if options.async: - if self.server_type == 'object': - self.async_check(hosts) - else: - print "Error: Can't check async's on non object servers." - if options.unmounted: - self.umount_check(hosts) - if options.replication: - if self.server_type == 'object': - self.object_replication_check(hosts) - else: - self.replication_check(hosts) - if options.auditor: - if self.server_type == 'object': - self.object_auditor_check(hosts) - else: - self.auditor_check(hosts) - if options.updater: - if self.server_type == 'account': - print "Error: Can't check updaters on account servers." - else: - self.updater_check(hosts) - if options.expirer: - if self.server_type == 'object': - self.expirer_check(hosts) - else: - print "Error: Can't check expired on non object servers." 
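Every check removed above (auditor, load, quarantine, sockstat, disk usage) follows the same scatter/gather pattern: scout one recon endpoint on each host, collect the per-host values, drop hosts that returned None, and report low/high/average. A minimal illustrative sketch of that aggregation step, using only the standard library (this is not Swift's actual _gen_stats/_print_stats code; the helper name and output format are assumptions):

def summarize(values, name):
    # Drop hosts that returned no data, then report the spread.
    values = [v for v in values if v is not None]
    if not values:
        print("[%s] - No hosts returned valid data." % name)
        return
    print("[%s] low: %s, high: %s, avg: %.2f, total: %s, reported: %d" % (
        name, min(values), max(values),
        sum(values) / float(len(values)), sum(values), len(values)))

# e.g. summarize([0.31, 1.20, None, 0.74], '1m_load_avg')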
- if options.loadstats: - self.load_check(hosts) - if options.diskusage: - self.disk_usage(hosts, options.top) - if options.md5: - self.get_ringmd5(hosts, ring_file) - if options.quarantined: - self.quarantine_check(hosts) - if options.sockstat: - self.socket_usage(hosts) - - -if __name__ == '__main__': - try: - reconnoiter = SwiftRecon() - reconnoiter.main() - except KeyboardInterrupt: - print '\n' diff --git a/bin/swift-recon-cron b/bin/swift-recon-cron deleted file mode 100755 index d8cb010780..0000000000 --- a/bin/swift-recon-cron +++ /dev/null @@ -1,63 +0,0 @@ -#!/usr/bin/env python -""" -swift-recon-cron.py -""" - -import os -import sys -from ConfigParser import ConfigParser -from swift.common.utils import get_logger, dump_recon_cache - - -def get_async_count(device_dir, logger): - async_count = 0 - for i in os.listdir(device_dir): - asyncdir = os.path.join(device_dir, i, "async_pending") - if os.path.isdir(asyncdir): - for entry in os.listdir(asyncdir): - if os.path.isdir(os.path.join(asyncdir, entry)): - async_hdir = os.path.join(asyncdir, entry) - async_count += len(os.listdir(async_hdir)) - return async_count - - -def main(): - c = ConfigParser() - try: - conf_path = sys.argv[1] - except Exception: - print "Usage: %s CONF_FILE" % sys.argv[0].split('/')[-1] - print "ex: swift-recon-cron /etc/swift/object-server.conf" - sys.exit(1) - if not c.read(conf_path): - print "Unable to read config file %s" % conf_path - sys.exit(1) - conf = dict(c.items('filter:recon')) - device_dir = conf.get('devices', '/srv/node') - recon_cache_path = conf.get('recon_cache_path', '/var/cache/swift') - recon_lock_path = conf.get('recon_lock_path', '/var/lock') - cache_file = os.path.join(recon_cache_path, "object.recon") - lock_dir = os.path.join(recon_lock_path, "swift-recon-object-cron") - conf['log_name'] = conf.get('log_name', 'recon-cron') - logger = get_logger(conf, log_route='recon-cron') - try: - os.mkdir(lock_dir) - except OSError as e: - logger.critical(_(str(e))) - print str(e) - sys.exit(1) - try: - asyncs = get_async_count(device_dir, logger) - except Exception: - logger.exception( - _('Exception during recon-cron while accessing devices')) - - dump_recon_cache({'async_pending': asyncs}, cache_file, logger) - - try: - os.rmdir(lock_dir) - except Exception: - logger.exception(_('Exception remove cronjob lock')) - -if __name__ == '__main__': - main() diff --git a/bin/swift-ring-builder b/bin/swift-ring-builder deleted file mode 100755 index a31021e3c0..0000000000 --- a/bin/swift-ring-builder +++ /dev/null @@ -1,628 +0,0 @@ -#! /usr/bin/env python -# Copyright (c) 2010-2012 OpenStack, LLC. -# -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. -# You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or -# implied. -# See the License for the specific language governing permissions and -# limitations under the License. 
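The swift-recon-cron helper removed above exists mainly to count async_pending entries under each device and dump that total into the recon cache. Its counting logic boils down to the following Python 3 sketch, mirroring get_async_count() from the deleted script (the /srv/node default comes from that script; error handling is omitted):

import os

def count_async_pendings(device_dir='/srv/node'):
    # For each device, sum the files under async_pending/<suffix>/.
    count = 0
    for device in os.listdir(device_dir):
        asyncdir = os.path.join(device_dir, device, 'async_pending')
        if not os.path.isdir(asyncdir):
            continue
        for suffix in os.listdir(asyncdir):
            suffix_dir = os.path.join(asyncdir, suffix)
            if os.path.isdir(suffix_dir):
                count += len(os.listdir(suffix_dir))
    return count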
- -import cPickle as pickle -from array import array -from errno import EEXIST -from itertools import islice, izip -from os import mkdir -from os.path import basename, dirname, exists, join as pathjoin -from sys import argv, exit -from textwrap import wrap -from time import time - -from swift.common import exceptions -from swift.common.ring import RingBuilder - - -MAJOR_VERSION = 1 -MINOR_VERSION = 3 -EXIT_SUCCESS = 0 -EXIT_WARNING = 1 -EXIT_ERROR = 2 - - -def format_device(dev): - """ - Format a device for display. - """ - if ':' in dev['ip']: - return 'd%(id)sz%(zone)s-[%(ip)s]:%(port)s/%(device)s_"%(meta)s"' % dev - else: - return 'd%(id)sz%(zone)s-%(ip)s:%(port)s/%(device)s_"%(meta)s"' % dev - - -class Commands: - - def unknown(): - print 'Unknown command: %s' % argv[2] - exit(EXIT_ERROR) - - def create(): - """ -swift-ring-builder create - - Creates with 2^ partitions and . - is number of hours to restrict moving a partition more - than once. - """ - if len(argv) < 6: - print Commands.create.__doc__.strip() - exit(EXIT_ERROR) - builder = RingBuilder(int(argv[3]), int(argv[4]), int(argv[5])) - backup_dir = pathjoin(dirname(argv[1]), 'backups') - try: - mkdir(backup_dir) - except OSError, err: - if err.errno != EEXIST: - raise - pickle.dump(builder.to_dict(), open(pathjoin(backup_dir, - '%d.' % time() + basename(argv[1])), 'wb'), protocol=2) - pickle.dump(builder.to_dict(), open(argv[1], 'wb'), protocol=2) - exit(EXIT_SUCCESS) - - def default(): - """ -swift-ring-builder - Shows information about the ring and the devices within. - """ - print '%s, build version %d' % (argv[1], builder.version) - zones = 0 - balance = 0 - if builder.devs: - zones = len(set(d['zone'] for d in builder.devs if d is not None)) - balance = builder.get_balance() - print '%d partitions, %d replicas, %d zones, %d devices, %.02f ' \ - 'balance' % (builder.parts, builder.replicas, zones, - len([d for d in builder.devs if d]), balance) - print 'The minimum number of hours before a partition can be ' \ - 'reassigned is %s' % builder.min_part_hours - if builder.devs: - print 'Devices: id zone ip address port name ' \ - 'weight partitions balance meta' - weighted_parts = builder.parts * builder.replicas / \ - sum(d['weight'] for d in builder.devs if d is not None) - for dev in builder.devs: - if dev is None: - continue - if not dev['weight']: - if dev['parts']: - balance = 999.99 - else: - balance = 0 - else: - balance = 100.0 * dev['parts'] / \ - (dev['weight'] * weighted_parts) - 100.0 - print ' %5d %5d %15s %5d %9s %6.02f %10s %7.02f %s' % \ - (dev['id'], dev['zone'], dev['ip'], dev['port'], - dev['device'], dev['weight'], dev['parts'], balance, - dev['meta']) - exit(EXIT_SUCCESS) - - def search(): - """ -swift-ring-builder search - Shows information about matching devices. 
- """ - if len(argv) < 4: - print Commands.search.__doc__.strip() - print - print builder.search_devs.__doc__.strip() - exit(EXIT_ERROR) - devs = builder.search_devs(argv[3]) - if not devs: - print 'No matching devices found' - exit(EXIT_ERROR) - print 'Devices: id zone ip address port name ' \ - 'weight partitions balance meta' - weighted_parts = builder.parts * builder.replicas / \ - sum(d['weight'] for d in builder.devs if d is not None) - for dev in devs: - if not dev['weight']: - if dev['parts']: - balance = 999.99 - else: - balance = 0 - else: - balance = 100.0 * dev['parts'] / \ - (dev['weight'] * weighted_parts) - 100.0 - print ' %5d %5d %15s %5d %9s %6.02f %10s %7.02f %s' % \ - (dev['id'], dev['zone'], dev['ip'], dev['port'], - dev['device'], dev['weight'], dev['parts'], balance, - dev['meta']) - exit(EXIT_SUCCESS) - - def list_parts(): - """ -swift-ring-builder list_parts [] .. - Returns a 2 column list of all the partitions that are assigned to any of - the devices matching the search values given. The first column is the - assigned partition number and the second column is the number of device - matches for that partition. The list is ordered from most number of matches - to least. If there are a lot of devices to match against, this command - could take a while to run. - """ - if len(argv) < 4: - print Commands.list_parts.__doc__.strip() - print - print builder.search_devs.__doc__.strip() - exit(EXIT_ERROR) - devs = [] - for arg in argv[3:]: - devs.extend(builder.search_devs(arg) or []) - if not devs: - print 'No matching devices found' - exit(EXIT_ERROR) - devs = [d['id'] for d in devs] - matches = [array('i') for x in xrange(builder.replicas)] - for part in xrange(builder.parts): - count = len([d for d in builder.get_part_devices(part) - if d['id'] in devs]) - if count: - matches[builder.replicas - count].append(part) - print 'Partition Matches' - for index, parts in enumerate(matches): - for part in parts: - print '%9d %7d' % (part, builder.replicas - index) - exit(EXIT_SUCCESS) - - def add(): - """ -swift-ring-builder add - z-:/_ - [z-:/_ ] ... - - Adds devices to the ring with the given information. No partitions will be - assigned to the new device until after running 'rebalance'. This is so you - can make multiple device changes and rebalance them all just once. 
- """ - if len(argv) < 5 or len(argv) % 2 != 1: - print Commands.add.__doc__.strip() - exit(EXIT_ERROR) - - devs_and_weights = izip(islice(argv, 3, len(argv), 2), - islice(argv, 4, len(argv), 2)) - for devstr, weightstr in devs_and_weights: - if not devstr.startswith('z'): - print 'Invalid add value: %s' % devstr - exit(EXIT_ERROR) - i = 1 - while i < len(devstr) and devstr[i].isdigit(): - i += 1 - zone = int(devstr[1:i]) - rest = devstr[i:] - - if not rest.startswith('-'): - print 'Invalid add value: %s' % devstr - print "The on-disk ring builder is unchanged.\n" - exit(EXIT_ERROR) - i = 1 - if rest[i] == '[': - i += 1 - while i < len(rest) and rest[i] != ']': - i += 1 - i += 1 - ip = rest[1:i].lstrip('[').rstrip(']') - rest = rest[i:] - else: - while i < len(rest) and rest[i] in '0123456789.': - i += 1 - ip = rest[1:i] - rest = rest[i:] - - if not rest.startswith(':'): - print 'Invalid add value: %s' % devstr - print "The on-disk ring builder is unchanged.\n" - exit(EXIT_ERROR) - i = 1 - while i < len(rest) and rest[i].isdigit(): - i += 1 - port = int(rest[1:i]) - rest = rest[i:] - - if not rest.startswith('/'): - print 'Invalid add value: %s' % devstr - print "The on-disk ring builder is unchanged.\n" - exit(EXIT_ERROR) - i = 1 - while i < len(rest) and rest[i] != '_': - i += 1 - device_name = rest[1:i] - rest = rest[i:] - - meta = '' - if rest.startswith('_'): - meta = rest[1:] - - try: - weight = float(weightstr) - except ValueError: - print 'Invalid weight value: %s' % weightstr - print "The on-disk ring builder is unchanged.\n" - exit(EXIT_ERROR) - - if weight < 0: - print 'Invalid weight value (must be positive): %s' % weightstr - print "The on-disk ring builder is unchanged.\n" - exit(EXIT_ERROR) - - for dev in builder.devs: - if dev is None: - continue - if dev['ip'] == ip and dev['port'] == port and \ - dev['device'] == device_name: - print 'Device %d already uses %s:%d/%s.' % \ - (dev['id'], dev['ip'], dev['port'], dev['device']) - print "The on-disk ring builder is unchanged.\n" - exit(EXIT_ERROR) - - builder.add_dev({'zone': zone, 'ip': ip, 'port': port, - 'device': device_name, 'weight': weight, - 'meta': meta}) - new_dev = builder.search_devs( - 'z%s-%s:%s/%s' % (zone, ip, port, device_name))[0]['id'] - if ':' in ip: - print 'Device z%s-[%s]:%s/%s_"%s" with %s weight got id %s' % \ - (zone, ip, port, device_name, meta, weight, new_dev) - else: - print 'Device z%s-%s:%s/%s_"%s" with %s weight got id %s' % \ - (zone, ip, port, device_name, meta, weight, new_dev) - pickle.dump(builder.to_dict(), open(argv[1], 'wb'), protocol=2) - exit(EXIT_SUCCESS) - - def set_weight(): - """ -swift-ring-builder set_weight - [ 1: - print 'Matched more than one device:' - for dev in devs: - print ' d%(id)sz%(zone)s-%(ip)s:%(port)s/%(device)s_' \ - '"%(meta)s"' % dev - if raw_input('Are you sure you want to update the weight for ' - 'these %s devices? (y/N) ' % len(devs)) != 'y': - print 'Aborting device modifications' - exit(EXIT_ERROR) - for dev in devs: - builder.set_dev_weight(dev['id'], weight) - print 'd%(id)sz%(zone)s-%(ip)s:%(port)s/%(device)s_' \ - '"%(meta)s" weight set to %(weight)s' % dev - pickle.dump(builder.to_dict(), open(argv[1], 'wb'), protocol=2) - exit(EXIT_SUCCESS) - - def set_info(): - """ -swift-ring-builder set_info - :/_ - [ :/_] ... - - For each search-value, resets the matched device's information. - This information isn't used to assign partitions, so you can use - 'write_ring' afterward to rewrite the current ring with the newer - device information. 
Any of the parts are optional in the final - :/_ parameter; just give what you - want to change. For instance set_info d74 _"snet: 5.6.7.8" would - just update the meta data for device id 74. - """ - if len(argv) < 5 or len(argv) % 2 != 1: - print Commands.set_info.__doc__.strip() - print - print builder.search_devs.__doc__.strip() - exit(EXIT_ERROR) - - searches_and_changes = izip(islice(argv, 3, len(argv), 2), - islice(argv, 4, len(argv), 2)) - - for search_value, change_value in searches_and_changes: - devs = builder.search_devs(search_value) - change = [] - if len(change_value) and change_value[0].isdigit(): - i = 1 - while (i < len(change_value) and - change_value[i] in '0123456789.'): - i += 1 - change.append(('ip', change_value[:i])) - change_value = change_value[i:] - elif len(change_value) and change_value[0] == '[': - i = 1 - while i < len(change_value) and change_value[i] != ']': - i += 1 - i += 1 - change.append(('ip', change_value[:i].lstrip('[').rstrip(']'))) - change_value = change_value[i:] - if change_value.startswith(':'): - i = 1 - while i < len(change_value) and change_value[i].isdigit(): - i += 1 - change.append(('port', int(change_value[1:i]))) - change_value = change_value[i:] - if change_value.startswith('/'): - i = 1 - while i < len(change_value) and change_value[i] != '_': - i += 1 - change.append(('device', change_value[1:i])) - change_value = change_value[i:] - if change_value.startswith('_'): - change.append(('meta', change_value[1:])) - change_value = '' - if change_value or not change: - raise ValueError('Invalid set info change value: %s' % - repr(argv[4])) - if not devs: - print("Search value \"%s\" matched 0 devices.\n" - "The on-disk ring builder is unchanged.\n" - % search_value) - exit(EXIT_ERROR) - if len(devs) > 1: - print 'Matched more than one device:' - for dev in devs: - print ' %s' % format_device(dev) - if raw_input('Are you sure you want to update the info for ' - 'these %s devices? (y/N) ' % len(devs)) != 'y': - print 'Aborting device modifications' - exit(EXIT_ERROR) - for dev in devs: - orig_dev_string = format_device(dev) - test_dev = dict(dev) - for key, value in change: - test_dev[key] = value - for check_dev in builder.devs: - if not check_dev or check_dev['id'] == test_dev['id']: - continue - if check_dev['ip'] == test_dev['ip'] and \ - check_dev['port'] == test_dev['port'] and \ - check_dev['device'] == test_dev['device']: - print 'Device %d already uses %s:%d/%s.' % \ - (check_dev['id'], check_dev['ip'], - check_dev['port'], check_dev['device']) - exit(EXIT_ERROR) - for key, value in change: - dev[key] = value - print 'Device %s is now %s' % (orig_dev_string, - format_device(dev)) - pickle.dump(builder.to_dict(), open(argv[1], 'wb'), protocol=2) - exit(EXIT_SUCCESS) - - def remove(): - """ -swift-ring-builder remove [search-value ...] - Removes the device(s) from the ring. This should normally just be used for - a device that has failed. For a device you wish to decommission, it's best - to set its weight to 0, wait for it to drain all its data, then use this - remove command. This will not take effect until after running 'rebalance'. - This is so you can make multiple device changes and rebalance them all just - once. 
- """ - if len(argv) < 4: - print Commands.remove.__doc__.strip() - print - print builder.search_devs.__doc__.strip() - exit(EXIT_ERROR) - - for search_value in argv[3:]: - devs = builder.search_devs(search_value) - if not devs: - print("Search value \"%s\" matched 0 devices.\n" - "The on-disk ring builder is unchanged." % search_value) - exit(EXIT_ERROR) - if len(devs) > 1: - print 'Matched more than one device:' - for dev in devs: - print ' d%(id)sz%(zone)s-%(ip)s:%(port)s/%(device)s_' \ - '"%(meta)s"' % dev - if raw_input('Are you sure you want to remove these %s ' - 'devices? (y/N) ' % len(devs)) != 'y': - print 'Aborting device removals' - exit(EXIT_ERROR) - for dev in devs: - try: - builder.remove_dev(dev['id']) - except exceptions.RingBuilderError, e: - print '-' * 79 - print( - "An error occurred while removing device with id %d\n" - "This usually means that you attempted to remove\n" - "the last device in a ring. If this is the case,\n" - "consider creating a new ring instead.\n" - "The on-disk ring builder is unchanged.\n" - "Original exception message: %s" % - (dev['id'], e.message) - ) - print '-' * 79 - exit(EXIT_ERROR) - - print 'd%(id)sz%(zone)s-%(ip)s:%(port)s/%(device)s_' \ - '"%(meta)s" marked for removal and will be removed' \ - ' next rebalance.' % dev - pickle.dump(builder.to_dict(), open(argv[1], 'wb'), protocol=2) - exit(EXIT_SUCCESS) - - def rebalance(): - """ -swift-ring-builder rebalance - Attempts to rebalance the ring by reassigning partitions that haven't been - recently reassigned. - """ - devs_changed = builder.devs_changed - try: - last_balance = builder.get_balance() - parts, balance = builder.rebalance() - except exceptions.RingBuilderError, e: - print '-' * 79 - print ("An error has occurred during ring validation. Common\n" - "causes of failure are rings that are empty or do not\n" - "have enough devices to accommodate the replica count.\n" - "Original exception message:\n %s" % e.message - ) - print '-' * 79 - exit(EXIT_ERROR) - if not parts: - print 'No partitions could be reassigned.' - print 'Either none need to be or none can be due to ' \ - 'min_part_hours [%s].' % builder.min_part_hours - exit(EXIT_WARNING) - if not devs_changed and abs(last_balance - balance) < 1: - print 'Cowardly refusing to save rebalance as it did not change ' \ - 'at least 1%.' - exit(EXIT_WARNING) - try: - builder.validate() - except exceptions.RingValidationError, e: - print '-' * 79 - print ("An error has occurred during ring validation. Common\n" - "causes of failure are rings that are empty or do not\n" - "have enough devices to accommodate the replica count.\n" - "Original exception message:\n %s" % e.message - ) - print '-' * 79 - exit(EXIT_ERROR) - print 'Reassigned %d (%.02f%%) partitions. Balance is now %.02f.' % \ - (parts, 100.0 * parts / builder.parts, balance) - status = EXIT_SUCCESS - if balance > 5: - print '-' * 79 - print 'NOTE: Balance of %.02f indicates you should push this ' % \ - balance - print ' ring, wait at least %d hours, and rebalance/repush.' \ - % builder.min_part_hours - print '-' * 79 - status = EXIT_WARNING - ts = time() - builder.get_ring().save( - pathjoin(backup_dir, '%d.' % ts + basename(ring_file))) - pickle.dump(builder.to_dict(), open(pathjoin(backup_dir, - '%d.' % ts + basename(argv[1])), 'wb'), protocol=2) - builder.get_ring().save(ring_file) - pickle.dump(builder.to_dict(), open(argv[1], 'wb'), protocol=2) - exit(status) - - def validate(): - """ -swift-ring-builder validate - Just runs the validation routines on the ring. 
- """ - builder.validate() - exit(EXIT_SUCCESS) - - def write_ring(): - """ -swift-ring-builder write_ring - Just rewrites the distributable ring file. This is done automatically after - a successful rebalance, so really this is only useful after one or more - 'set_info' calls when no rebalance is needed but you want to send out the - new device information. - """ - ring_data = builder.get_ring() - if not ring_data._replica2part2dev_id: - if ring_data.devs: - print 'Warning: Writing a ring with no partition ' \ - 'assignments but with devices; did you forget to run ' \ - '"rebalance"?' - else: - print 'Warning: Writing an empty ring' - ring_data.save( - pathjoin(backup_dir, '%d.' % time() + basename(ring_file))) - ring_data.save(ring_file) - exit(EXIT_SUCCESS) - - def pretend_min_part_hours_passed(): - builder.pretend_min_part_hours_passed() - pickle.dump(builder.to_dict(), open(argv[1], 'wb'), protocol=2) - exit(EXIT_SUCCESS) - - def set_min_part_hours(): - """ -swift-ring-builder set_min_part_hours - Changes the to the given . This should be set to - however long a full replication/update cycle takes. We're working on a way - to determine this more easily than scanning logs. - """ - if len(argv) < 4: - print Commands.set_min_part_hours.__doc__.strip() - exit(EXIT_ERROR) - builder.change_min_part_hours(int(argv[3])) - print 'The minimum number of hours before a partition can be ' \ - 'reassigned is now set to %s' % argv[3] - pickle.dump(builder.to_dict(), open(argv[1], 'wb'), protocol=2) - exit(EXIT_SUCCESS) - - -if __name__ == '__main__': - if len(argv) < 2: - print "swift-ring-builder %(MAJOR_VERSION)s.%(MINOR_VERSION)s\n" % \ - globals() - print Commands.default.__doc__.strip() - print - cmds = [c for c, f in Commands.__dict__.iteritems() - if f.__doc__ and c[0] != '_' and c != 'default'] - cmds.sort() - for cmd in cmds: - print Commands.__dict__[cmd].__doc__.strip() - print - print RingBuilder.search_devs.__doc__.strip() - print - for line in wrap(' '.join(cmds), 79, initial_indent='Quick list: ', - subsequent_indent=' '): - print line - print ('Exit codes: 0 = operation successful\n' - ' 1 = operation completed with warnings\n' - ' 2 = error') - exit(EXIT_SUCCESS) - - if exists(argv[1]): - builder = RingBuilder.load(argv[1]) - elif len(argv) < 3 or argv[2] != 'create': - print 'Ring Builder file does not exist: %s' % argv[1] - exit(EXIT_ERROR) - - backup_dir = pathjoin(dirname(argv[1]), 'backups') - try: - mkdir(backup_dir) - except OSError, err: - if err.errno != EEXIST: - raise - - ring_file = argv[1] - if ring_file.endswith('.builder'): - ring_file = ring_file[:-len('.builder')] - ring_file += '.ring.gz' - - if len(argv) == 2: - command = "default" - else: - command = argv[2] - Commands.__dict__.get(command, Commands.unknown)() diff --git a/bin/swift-temp-url b/bin/swift-temp-url deleted file mode 100755 index da7595a753..0000000000 --- a/bin/swift-temp-url +++ /dev/null @@ -1,59 +0,0 @@ -#!/usr/bin/env python - -import hmac -from hashlib import sha1 -from os.path import basename -from sys import argv, exit -from time import time - - -if __name__ == '__main__': - if len(argv) != 5: - prog = basename(argv[0]) - print 'Syntax: %s ' % prog - print - print 'Where:' - print ' The method to allow, GET or PUT.' - print ' Note: HEAD will also be allowed.' - print ' The number of seconds from now to allow requests.' - print ' The full path to the resource.' - print ' Example: /v1/AUTH_account/c/o' - print ' The X-Account-Meta-Temp-URL-Key for the account.' 
- print - print 'Example output:' - print ' /v1/AUTH_account/c/o?temp_url_sig=34d49efc32fe6e3082e411e' \ - 'eeb85bd8a&temp_url_expires=1323482948' - print - print 'This can be used to form a URL to give out for the access ' - print 'allowed. For example:' - print ' echo https://swift-cluster.example.com`%s GET 60 ' \ - '/v1/AUTH_account/c/o mykey`' % prog - print - print 'Might output:' - print ' https://swift-cluster.example.com/v1/AUTH_account/c/o?' \ - 'temp_url_sig=34d49efc32fe6e3082e411eeeb85bd8a&' \ - 'temp_url_expires=1323482948' - exit(1) - method, seconds, path, key = argv[1:] - if method not in ('GET', 'PUT'): - print 'Please use either the GET or PUT method.' - exit(1) - try: - expires = int(time() + int(seconds)) - except ValueError: - expires = 0 - if expires < 1: - print 'Please use a positive value.' - exit(1) - parts = path.split('/', 4) - # Must be five parts, ['', 'v1', 'a', 'c', 'o'], must be a v1 request, have - # account, container, and object values, and the object value can't just - # have '/'s. - if len(parts) != 5 or parts[0] or parts[1] != 'v1' or not parts[2] or \ - not parts[3] or not parts[4].strip('/'): - print ' must point to an object.' - print 'For example: /v1/account/container/object' - exit(1) - sig = hmac.new(key, '%s\n%s\n%s' % (method, expires, path), - sha1).hexdigest() - print '%s?temp_url_sig=%s&temp_url_expires=%s' % (path, sig, expires) diff --git a/bindep.txt b/bindep.txt new file mode 100644 index 0000000000..4510a6059b --- /dev/null +++ b/bindep.txt @@ -0,0 +1,39 @@ +# This is a cross-platform list tracking distribution packages needed by tests; +# see http://docs.openstack.org/infra/bindep/ for additional information. + +build-essential [platform:dpkg] +linux-headers [platform:apk] +gcc [platform:rpm platform:apk] +gettext [!platform:suse] +gettext-runtime [platform:suse] +liberasurecode-dev [platform:dpkg] +# There's no library in CentOS 7 but Fedora and openSUSE have it. +liberasurecode-devel [platform:rpm !platform:centos] +libffi-dev [platform:dpkg platform:apk] +libffi-devel [platform:rpm] +libxml2-dev [platform:dpkg platform:apk] +libxml2-devel [platform:rpm] +libxslt-devel [platform:rpm] +libxslt1-dev [platform:dpkg] +libxslt-dev [platform:apk] +memcached +python3-dev [platform:dpkg platform:apk test] +python3-devel [platform:rpm test] +# python3-devel does not pull in the python3 package on openSUSE so +# we need to be explicit. The python3 package contains the XML module +# which is required by a python3 virtualenv. +# See https://bugzilla.suse.com/show_bug.cgi?id=1046990 +python3 [platform:suse platform:apk test] +rsync +xfsprogs +libssl-dev [platform:dpkg] +openssl-devel [platform:redhat] +openssl-dev [platform:apk] +libopenssl-devel [platform:suse] +py-cffi [platform:apk] +musl-dev [platform:apk] +man-db [pep8] +man [platform:rpm pep8] +# libsrvg2 is required to build docs +librsvg2-tools [doc platform:rpm] +librsvg2-bin [doc platform:dpkg] diff --git a/doc/manpages/account-server.conf.5 b/doc/manpages/account-server.conf.5 index acc1742ba8..f3a9c1851a 100644 --- a/doc/manpages/account-server.conf.5 +++ b/doc/manpages/account-server.conf.5 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2010-2012 OpenStack, LLC. +.\" Copyright (c) 2010-2012 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. 
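The swift-temp-url helper removed above boils down to one HMAC-SHA1 signature over "METHOD\nEXPIRES\nPATH", exactly as its last few lines show. A Python 3 equivalent of that computation (the key and path in the usage comment are examples only):

import hmac
from hashlib import sha1
from time import time

def temp_url(method, seconds, path, key):
    # Same signature body as the removed script, with the explicit
    # bytes handling Python 3 requires.
    expires = int(time() + seconds)
    body = '%s\n%s\n%s' % (method, expires, path)
    sig = hmac.new(key.encode('utf-8'), body.encode('utf-8'), sha1).hexdigest()
    return '%s?temp_url_sig=%s&temp_url_expires=%s' % (path, sig, expires)

# e.g. temp_url('GET', 60, '/v1/AUTH_account/c/o', 'mykey')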
@@ -20,7 +20,7 @@ .SH NAME .LP .B account-server.conf -\- configuration file for the openstack-swift account server +\- configuration file for the OpenStack Swift account server @@ -42,7 +42,7 @@ certain number of key/value parameters which are described later. Any line that begins with a '#' symbol is ignored. You can find more information about python-pastedeploy configuration format at -\fIhttp://pythonpaste.org/deploy/#config-format\fR +\fIhttps://docs.pylonsproject.org/projects/pastedeploy/en/latest/#config-format\fR @@ -56,26 +56,91 @@ are acceptable within this section. IP address the account server should bind to. The default is 0.0.0.0 which will make it bind to all available addresses. .IP "\fBbind_port\fR" -TCP port the account server should bind to. The default is 6002. +TCP port the account server should bind to. The default is 6202. +.IP "\fBkeep_idle\fR" +Value to set for socket TCP_KEEPIDLE. The default value is 600. +.IP "\fBbind_timeout\fR" +Timeout to bind socket. The default is 30. .IP \fBbacklog\fR TCP backlog. Maximum number of allowed pending connections. The default value is 4096. .IP \fBworkers\fR -Number of account server workers to fork. The default is 1. +The number of pre-forked processes that will accept connections. Zero means +no fork. The default is auto which will make the server try to match the +number of effective cpu cores if python multiprocessing is available (included +with most python distributions >= 2.6) or fallback to one. It's worth noting +that individual workers will use many eventlet co-routines to service multiple +concurrent requests. +.IP \fBmax_clients\fR +Maximum number of clients one worker can process simultaneously (it will +actually accept(2) N + 1). Setting this to one (1) will only handle one request +at a time, without accepting another request concurrently. The default is 1024. .IP \fBuser\fR The system user that the account server will run as. The default is swift. .IP \fBswift_dir\fR Swift configuration directory. The default is /etc/swift. .IP \fBdevices\fR -Parent directory or where devices are mounted. Default is /srv/node. +Parent directory of where devices are mounted. Default is /srv/node. .IP \fBmount_check\fR Whether or not check if the devices are mounted to prevent accidentally writing to the root device. The default is set to true. +.IP \fBdisable_fallocate\fR +Disable pre-allocate disk space for a file. The default is false. .IP \fBlog_name\fR Label used when logging. The default is swift. .IP \fBlog_facility\fR Syslog log facility. The default is LOG_LOCAL0. .IP \fBlog_level\fR Logging level. The default is INFO. +.IP "\fBlog_address\fR +Logging address. The default is /dev/log. +.IP \fBlog_max_line_length\fR +The following caps the length of log lines to the value given; no limit if +set to 0, the default. +.IP \fBlog_custom_handlers\fR +Comma separated list of functions to call to setup custom log handlers. +functions get passed: conf, name, log_to_console, log_route, fmt, logger, +adapted_logger. The default is empty. +.IP \fBlog_udp_host\fR +If set, log_udp_host will override log_address. +.IP "\fBlog_udp_port\fR +UDP log port, the default is 514. +.IP \fBlog_statsd_host\fR +StatsD server. IPv4/IPv6 addresses and hostnames are +supported. If a hostname resolves to an IPv4 and IPv6 address, the IPv4 +address will be used. +.IP \fBlog_statsd_port\fR +The default is 8125. +.IP \fBlog_statsd_default_sample_rate\fR +The default is 1. +.IP \fBlog_statsd_sample_rate_factor\fR +The default is 1. 
+.IP \fBlog_statsd_metric_prefix\fR +The default is empty. +.IP \fBdb_preallocation\fR +If you don't mind the extra disk space usage in overhead, you can turn this +on to preallocate disk space with SQLite databases to decrease fragmentation. +The default is false. +.IP \fBeventlet_debug\fR +Debug mode for eventlet library. The default is false. +.IP \fBfallocate_reserve\fR +You can set fallocate_reserve to the number of bytes or percentage of disk +space you'd like fallocate to reserve, whether there is space for the given +file size or not. Percentage will be used if the value ends with a '%'. +The default is 1%. +.IP \fBnice_priority\fR +Modify scheduling priority of server processes. Niceness values range from -20 +(most favorable to the process) to 19 (least favorable to the process). +The default does not modify priority. +.IP \fBionice_class\fR +Modify I/O scheduling class of server processes. I/O niceness class values +are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and IOPRIO_CLASS_IDLE (idle). +The default does not modify class and priority. +Work only with ionice_priority. +.IP \fBionice_priority\fR +Modify I/O scheduling priority of server processes. I/O niceness priority +is a number which goes from 0 to 7. The higher the value, the lower +the I/O priority of the process. Work only with ionice_class. +Ignored if IOPRIO_CLASS_IDLE is set. .RE .PD @@ -108,12 +173,33 @@ This is normally \fBegg:swift#account\fR. Label used when logging. The default is account-server. .IP "\fBset log_facility\fR Syslog log facility. The default is LOG_LOCAL0. -.IP "\fB set log_level\fR +.IP "\fBset log_level\fR Logging level. The default is INFO. -.IP "\fB set log_requests\fR +.IP "\fBset log_requests\fR Enables request logging. The default is True. -.IP "\fB set log_address\fR +.IP "\fBset log_address\fR Logging address. The default is /dev/log. +.IP "\fBreplication_server\fR +Configure parameter for creating specific server. +To handle all verbs, including replication verbs, do not specify +"replication_server" (this is the default). To only handle replication, +set to a true value (e.g. "true" or "1"). To handle only non-replication +verbs, set to "false". Unless you have a separate replication network, you +should not specify any value for "replication_server". The default is empty. +.IP \fBnice_priority\fR +Modify scheduling priority of server processes. Niceness values range from -20 +(most favorable to the process) to 19 (least favorable to the process). +The default does not modify priority. +.IP \fBionice_class\fR +Modify I/O scheduling class of server processes. I/O niceness class values +are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and IOPRIO_CLASS_IDLE (idle). +The default does not modify class and priority. +Work only with ionice_priority. +.IP \fBionice_priority\fR +Modify I/O scheduling priority of server processes. I/O niceness priority +is a number which goes from 0 to 7. The higher the value, the lower +the I/O priority of the process. Work only with ionice_class. +Ignored if IOPRIO_CLASS_IDLE is set. .RE .PD @@ -149,6 +235,36 @@ and ensure that swift has read/write. The default is /var/cache/swift. .RE .PD +.RS 0 +.IP "\fB[filter:xprofile]\fR" +.RS 3 +.IP "\fBuse\fR" +Entry point for paste.deploy for the xprofile middleware. This is the reference to the installed python egg. +This is normally \fBegg:swift#xprofile\fR. +.IP "\fBprofile_module\fR" +This option enable you to switch profilers which should inherit from python +standard profiler. 
Currently the supported value can be 'cProfile', 'eventlet.green.profile' etc. +.IP "\fBlog_filename_prefix\fR" +This prefix will be used to combine process ID and timestamp to name the +profile data file. Make sure the executing user has permission to write +into this path (missing path segments will be created, if necessary). +If you enable profiling in more than one type of daemon, you must override +it with an unique value like, the default is /var/log/swift/profile/account.profile. +.IP "\fBdump_interval\fR" +The profile data will be dumped to local disk based on above naming rule +in this interval. The default is 5.0. +.IP "\fBdump_timestamp\fR" +Be careful, this option will enable profiler to dump data into the file with +time stamp which means there will be lots of files piled up in the directory. +The default is false +.IP "\fBpath\fR" +This is the path of the URL to access the mini web UI. The default is __profile__. +.IP "\fBflush_at_shutdown\fR" +Clear the data when the wsgi server shutdown. The default is false. +.IP "\fBunwind\fR" +Unwind the iterator of applications. Default is false. +.RE +.PD .SH ADDITIONAL SECTIONS @@ -167,24 +283,16 @@ Syslog log facility. The default is LOG_LOCAL0. Logging level. The default is INFO. .IP \fBlog_address\fR Logging address. The default is /dev/log. -.IP \fBvm_test_mode\fR -Indicates that you are using a VM environment. The default is no. .IP \fBper_diff\fR -The default is 1000. +Maximum number of database rows that will be sync'd in a single HTTP replication request. The default is 1000. .IP \fBmax_diffs\fR This caps how long the replicator will spend trying to sync a given database per pass so the other databases don't get starved. The default is 100. .IP \fBconcurrency\fR Number of replication workers to spawn. The default is 8. .IP "\fBrun_pause [deprecated]\fR" -Time in seconds to wait between replication passes. The default is 10. +Time in seconds to wait between replication passes. The default is 30. .IP \fBinterval\fR Replaces run_pause with the more standard "interval", which means the replicator won't pause unless it takes less than the interval set. The default is 30. -.IP \fBerror_suppression_interval\fR -How long without an error before a node's error count is reset. This will also be how long before a node is re-enabled after suppression is triggered. -The default is 60 seconds. -.IP \fBerror_suppression_limit\fR -How many errors can accumulate before a node is temporarily ignored. The default -is 10 seconds. .IP \fBnode_timeout\fR Request timeout to external services. The default is 10 seconds. .IP \fBconn_timeout\fR @@ -192,6 +300,29 @@ Connection timeout to external services. The default is 0.5 seconds. .IP \fBreclaim_age\fR Time elapsed in seconds before an account can be reclaimed. The default is 604800 seconds. +.IP \fBrsync_compress\fR +Allow rsync to compress data which is transmitted to destination node +during sync. However, this is applicable only when destination node is in +a different region than the local one. The default is false. +.IP \fBrsync_module\fR +Format of the rsync module where the replicator will send data. See +etc/rsyncd.conf-sample for some usage examples. +.IP \fBrecon_cache_path\fR +Path to recon cache directory. The default is /var/cache/swift. +.IP \fBnice_priority\fR +Modify scheduling priority of server processes. Niceness values range from -20 +(most favorable to the process) to 19 (least favorable to the process). +The default does not modify priority. 
+.IP \fBionice_class\fR +Modify I/O scheduling class of server processes. I/O niceness class values +are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and IOPRIO_CLASS_IDLE (idle). +The default does not modify class and priority. +Work only with ionice_priority. +.IP \fBionice_priority\fR +Modify I/O scheduling priority of server processes. I/O niceness priority +is a number which goes from 0 to 7. The higher the value, the lower +the I/O priority of the process. Work only with ionice_class. +Ignored if IOPRIO_CLASS_IDLE is set. .RE @@ -210,6 +341,24 @@ Logging level. The default is INFO. Logging address. The default is /dev/log. .IP \fBinterval\fR Will audit, at most, 1 account per device per interval. The default is 1800 seconds. +.IP \fBaccounts_per_second\fR +Maximum accounts audited per second. Should be tuned according to individual system specs. 0 is unlimited. The default is 200. +.IP \fBrecon_cache_path\fR +Path to recon cache directory. The default is /var/cache/swift. +.IP \fBnice_priority\fR +Modify scheduling priority of server processes. Niceness values range from -20 +(most favorable to the process) to 19 (least favorable to the process). +The default does not modify priority. +.IP \fBionice_class\fR +Modify I/O scheduling class of server processes. I/O niceness class values +are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and IOPRIO_CLASS_IDLE (idle). +The default does not modify class and priority. +Work only with ionice_priority. +.IP \fBionice_priority\fR +Modify I/O scheduling priority of server processes. I/O niceness priority +is a number which goes from 0 to 7. The higher the value, the lower +the I/O priority of the process. Work only with ionice_class. +Ignored if IOPRIO_CLASS_IDLE is set. .RE @@ -234,6 +383,36 @@ Minimum time for a pass to take. The default is 3600 seconds. Request timeout to external services. The default is 10 seconds. .IP \fBconn_timeout\fR Connection timeout to external services. The default is 0.5 seconds. +.IP \fBdelay_reaping\fR +Normally, the reaper begins deleting account information for deleted accounts +immediately; you can set this to delay its work however. The value is in +seconds. The default is 0. The sum of this value and the +container-updater interval should be less than the account-replicator +reclaim_age. This ensures that once the account-reaper has deleted a +container there is sufficient time for the container-updater to report to the +account before the account DB is removed. +.IP \fBreap_warn_after\fR +If the account fails to be reaped due to a persistent error, the +account reaper will log a message such as: + Account has not been reaped since +You can search logs for this message if space is not being reclaimed +after you delete account(s). +Default is 2592000 seconds (30 days). This is in addition to any time +requested by delay_reaping. +.IP \fBnice_priority\fR +Modify scheduling priority of server processes. Niceness values range from -20 +(most favorable to the process) to 19 (least favorable to the process). +The default does not modify priority. +.IP \fBionice_class\fR +Modify I/O scheduling class of server processes. I/O niceness class values +are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and IOPRIO_CLASS_IDLE (idle). +The default does not modify class and priority. +Work only with ionice_priority. +.IP \fBionice_priority\fR +Modify I/O scheduling priority of server processes. I/O niceness priority +is a number which goes from 0 to 7. 
The higher the value, the lower +the I/O priority of the process. Work only with ionice_class. +Ignored if IOPRIO_CLASS_IDLE is set. .RE .PD @@ -243,13 +422,11 @@ Connection timeout to external services. The default is 0.5 seconds. .SH DOCUMENTATION .LP More in depth documentation about the swift-account-server and -also Openstack-Swift as a whole can be found at -.BI http://swift.openstack.org/admin_guide.html +also OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/admin_guide.html and -.BI http://swift.openstack.org +.BI https://docs.openstack.org/swift/latest/ .SH "SEE ALSO" .BR swift-account-server(1), - - diff --git a/doc/manpages/container-reconciler.conf.5 b/doc/manpages/container-reconciler.conf.5 new file mode 100644 index 0000000000..79797b6496 --- /dev/null +++ b/doc/manpages/container-reconciler.conf.5 @@ -0,0 +1,182 @@ +.\" +.\" Author: HCLTech-SSW +.\" Copyright (c) 2010-2017 OpenStack Foundation. +.\" +.\" Licensed under the Apache License, Version 2.0 (the "License"); +.\" you may not use this file except in compliance with the License. +.\" You may obtain a copy of the License at +.\" +.\" http://www.apache.org/licenses/LICENSE-2.0 +.\" +.\" Unless required by applicable law or agreed to in writing, software +.\" distributed under the License is distributed on an "AS IS" BASIS, +.\" WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +.\" implied. +.\" See the License for the specific language governing permissions and +.\" limitations under the License. +.\" +.TH container-reconciler.conf 5 "10/25/2017" "Linux" "OpenStack Swift" + +.SH NAME +.LP +.B container-reconciler.conf +\- configuration file for the OpenStack Swift container reconciler + + +.SH SYNOPSIS +.LP +.B container-reconciler.conf + + +.SH DESCRIPTION +.PP +This is the configuration file used by the container reconciler. + +The configuration file follows the python-pastedeploy syntax. The file is divided +into sections, which are enclosed by square brackets. Each section will contain a +certain number of key/value parameters which are described later. + +Any line that begins with a '#' symbol is ignored. + +You can find more information about python-pastedeploy configuration format at +\fIhttps://docs.pylonsproject.org/projects/pastedeploy/en/latest/#config-format\fR + + +.SH GLOBAL SECTION +.PD 1 +.RS 0 +This is indicated by section named [DEFAULT]. Below are the parameters that +are acceptable within this section. + +.IP "\fBlog_address\fR" +Location where syslog sends the logs to. The default is /dev/log. +.IP "\fBlog_custom_handlers \fR" +Comma-separated list of functions to call to setup custom log handlers. +.IP "\fBlog_facility\fR" +Syslog log facility. The default is LOG_LOCAL0. +.IP "\fBlog_level\fR" +Log level used for logging. The default is INFO. +.IP "\fBlog_name\fR" +Label used when logging. The default is swift. +.IP "\fBlog_statsd_default_sample_rate\fR" +Defines the probability of sending a sample for any given event or +timing measurement. The default is 1.0. +.IP "\fBlog_statsd_host\fR" +If not set, the StatsD feature is disabled. The default is localhost. +.IP "\fBlog_statsd_metric_prefix\fR" +Value will be prepended to every metric sent to the StatsD server. +.IP "\fBlog_statsd_port\fR" +The port value for the StatsD server. The default is 8125. +.IP "\fBlog_statsd_sample_rate_factor\fR" +It is not recommended to set this to a value less than 1.0, if frequency of +logging is too high, tune the log_statsd_default_sample_rate instead. 
+The default value is 1.0. +.IP "\fBlog_udp_host\fR" +If not set, the UDP receiver for syslog is disabled. +.IP "\fBlog_udp_port\fR" +Port value for UDP receiver, if enabled. The default is 514. +.IP "\fBswift_dir\fR" +Swift configuration directory. The default is /etc/swift. +.IP "\fBuser\fR" +User to run as. The default is swift. +.RE +.PD + + +.SH CONTAINER RECONCILER SECTION +.PD 1 +.RS 0 +.IP "\fB[container-reconciler]\fR" +.RE +.RS 3 +.IP "\fBinterval\fR" +Minimum time for a pass to take. The default is 30 seconds. +.IP "\fBreclaim_age\fR" +Time elapsed in seconds before an object can be reclaimed. The default is 604800 seconds. +.IP "\fBrequest_tries\fR" +Server errors from requests will be retried by default. The default is 3. +.RE +.PD + + +.SH PIPELINE SECTION +.PD 1 +.RS 0 +.IP "\fB[pipeline:main]\fR" +.RE +.RS 3 +.IP "\fBpipeline\fR" +Pipeline to use for processing operations. The default is "catch_errors proxy-logging cache proxy-server". +.RE +.PD + + +.SH APP SECTION +.PD 1 +.RS 0 +\fBFor details of the available options see proxy-server.conf.5.\fR + +.RS 0 +.IP "\fB[app:proxy-server]\fR" +.RE +.RS 3 +.IP "\fBuse\fR" +Entry point for paste.deploy in the server. +This is normally \fBegg:swift#proxy\fR. +.RE +.PD + + +.SH FILTER SECTIONS +.PD 1 +.RS 0 +Any section that has its name prefixed by "filter:" indicates a filter section. +Filters are used to specify configuration parameters for specific swift middlewares. +Below are the filters available and respective acceptable parameters. + +\fBFor details of the available options for each filter section see proxy-server.conf.5.\fR + +.RS 0 +.IP "\fB[filter:cache]\fR" +.RE +Caching middleware that manages caching in swift. + +.RS 3 +.IP "\fBuse\fR" +Entry point for paste.deploy in the server. +This is normally \fBegg:swift#memcache\fR. +.RE +.PD + + +.RS 0 +.IP "\fB[filter:catch_errors]\fR" +.RE +.RS 3 +.IP "\fBuse\fR" +Entry point for paste.deploy in the server. +This is normally \fBegg:swift#catch_errors\fR. +.RE +.PD + + +.RS 0 +.IP "\fB[filter:proxy-logging]\fR" +.RE +.RS 3 +.IP "\fBuse\fR" +Entry point for paste.deploy in the server. +This is normally \fBegg:swift#proxy_logging\fR. +.RE +.PD + + +.SH DOCUMENTATION +.LP +More in depth documentation in regards to +.BI swift-container-reconciler +and also about OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/overview_policies.html. + +.SH "SEE ALSO" +.BR swift-container-reconciler(1) diff --git a/doc/manpages/container-server.conf.5 b/doc/manpages/container-server.conf.5 index 406545b186..000bc3e94e 100644 --- a/doc/manpages/container-server.conf.5 +++ b/doc/manpages/container-server.conf.5 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2010-2012 OpenStack, LLC. +.\" Copyright (c) 2010-2012 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. @@ -20,7 +20,7 @@ .SH NAME .LP .B container-server.conf -\- configuration file for the openstack-swift container server +\- configuration file for the OpenStack Swift container server @@ -42,7 +42,7 @@ certain number of key/value parameters which are described later. Any line that begins with a '#' symbol is ignored. 
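Because every one of these server and daemon configs shares this INI-style, python-pastedeploy layout, the option tables in these man pages map directly onto sections that can be read with a stock ConfigParser, much as the removed swift-recon-cron did. A minimal sketch, assuming the [container-reconciler] options and defaults documented above (the path is an example):

from configparser import ConfigParser

c = ConfigParser()
c.read('/etc/swift/container-reconciler.conf')
opts = dict(c.items('container-reconciler')) if c.has_section('container-reconciler') else {}
interval = float(opts.get('interval', 30))          # default 30 seconds
reclaim_age = int(opts.get('reclaim_age', 604800))  # default 7 days
request_tries = int(opts.get('request_tries', 3))
print(interval, reclaim_age, request_tries)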
You can find more information about python-pastedeploy configuration format at -\fIhttp://pythonpaste.org/deploy/#config-format\fR +\fIhttps://docs.pylonsproject.org/projects/pastedeploy/en/latest/#config-format\fR @@ -56,20 +56,41 @@ are acceptable within this section. IP address the container server should bind to. The default is 0.0.0.0 which will make it bind to all available addresses. .IP "\fBbind_port\fR" -TCP port the container server should bind to. The default is 6001. +TCP port the container server should bind to. The default is 6201. +.IP "\fBkeep_idle\fR" +Value to set for socket TCP_KEEPIDLE. The default value is 600. +.IP "\fBbind_timeout\fR" +Timeout to bind socket. The default is 30. .IP \fBbacklog\fR TCP backlog. Maximum number of allowed pending connections. The default value is 4096. .IP \fBworkers\fR -Number of container server workers to fork. The default is 1. +The number of pre-forked processes that will accept connections. Zero means +no fork. The default is auto which will make the server try to match the +number of effective cpu cores if python multiprocessing is available (included +with most python distributions >= 2.6) or fallback to one. It's worth noting +that individual workers will use many eventlet co-routines to service multiple +concurrent requests. +.IP \fBmax_clients\fR +Maximum number of clients one worker can process simultaneously (it will +actually accept(2) N + 1). Setting this to one (1) will only handle one request +at a time, without accepting another request concurrently. The default is 1024. +.IP \fBallowed_sync_hosts\fR +This is a comma separated list of hosts allowed in the X-Container-Sync-To +field for containers. This is the old-style of using container sync. It is +strongly recommended to use the new style of a separate +container-sync-realms.conf -- see container-sync-realms.conf-sample +allowed_sync_hosts = 127.0.0.1 .IP \fBuser\fR The system user that the container server will run as. The default is swift. .IP \fBswift_dir\fR Swift configuration directory. The default is /etc/swift. .IP \fBdevices\fR -Parent directory or where devices are mounted. Default is /srv/node. +Parent directory of where devices are mounted. Default is /srv/node. .IP \fBmount_check\fR Whether or not check if the devices are mounted to prevent accidentally writing to the root device. The default is set to true. +.IP \fBdisable_fallocate\fR +Disable pre-allocate disk space for a file. The default is false. .IP \fBlog_name\fR Label used when logging. The default is swift. .IP \fBlog_facility\fR @@ -78,6 +99,54 @@ Syslog log facility. The default is LOG_LOCAL0. Logging level. The default is INFO. .IP \fBlog_address\fR Logging address. The default is /dev/log. +.IP \fBlog_max_line_length\fR +The following caps the length of log lines to the value given; no limit if +set to 0, the default. +.IP \fBlog_custom_handlers\fR +Comma separated list of functions to call to setup custom log handlers. +functions get passed: conf, name, log_to_console, log_route, fmt, logger, +adapted_logger. The default is empty. +.IP \fBlog_udp_host\fR +If set, log_udp_host will override log_address. +.IP "\fBlog_udp_port\fR +UDP log port, the default is 514. +.IP \fBlog_statsd_host\fR +StatsD server. IPv4/IPv6 addresses and hostnames are +supported. If a hostname resolves to an IPv4 and IPv6 address, the IPv4 +address will be used. +.IP \fBlog_statsd_port\fR +The default is 8125. +.IP \fBlog_statsd_default_sample_rate\fR +The default is 1. 
+.IP \fBlog_statsd_sample_rate_factor\fR +The default is 1. +.IP \fBlog_statsd_metric_prefix\fR +The default is empty. +.IP \fBdb_preallocation\fR +If you don't mind the extra disk space usage in overhead, you can turn this +on to preallocate disk space with SQLite databases to decrease fragmentation. +The default is false. +.IP \fBeventlet_debug\fR +Debug mode for eventlet library. The default is false. +.IP \fBfallocate_reserve\fR +You can set fallocate_reserve to the number of bytes or percentage of disk +space you'd like fallocate to reserve, whether there is space for the given +file size or not. Percentage will be used if the value ends with a '%'. +The default is 1%. +.IP \fBnice_priority\fR +Modify scheduling priority of server processes. Niceness values range from -20 +(most favorable to the process) to 19 (least favorable to the process). +The default does not modify priority. +.IP \fBionice_class\fR +Modify I/O scheduling class of server processes. I/O niceness class values +are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and IOPRIO_CLASS_IDLE (idle). +The default does not modify class and priority. +Work only with ionice_priority. +.IP \fBionice_priority\fR +Modify I/O scheduling priority of server processes. I/O niceness priority +is a number which goes from 0 to 7. The higher the value, the lower +the I/O priority of the process. Work only with ionice_class. +Ignored if IOPRIO_CLASS_IDLE is set. .RE .PD @@ -110,16 +179,39 @@ This is normally \fBegg:swift#container\fR. Label used when logging. The default is container-server. .IP "\fBset log_facility\fR Syslog log facility. The default is LOG_LOCAL0. -.IP "\fB set log_level\fR +.IP "\fBset log_level\fR Logging level. The default is INFO. -.IP "\fB set log_requests\fR +.IP "\fBset log_requests\fR Enables request logging. The default is True. -.IP "\fB set log_address\fR +.IP "\fBset log_address\fR Logging address. The default is /dev/log. .IP \fBnode_timeout\fR Request timeout to external services. The default is 3 seconds. .IP \fBconn_timeout\fR Connection timeout to external services. The default is 0.5 seconds. +.IP \fBallow_versions\fR +The default is false. +.IP \fBreplication_server\fR +Configure parameter for creating specific server. +To handle all verbs, including replication verbs, do not specify +"replication_server" (this is the default). To only handle replication, +set to a True value (e.g. "True" or "1"). To handle only non-replication +verbs, set to "False". Unless you have a separate replication network, you +should not specify any value for "replication_server". +.IP \fBnice_priority\fR +Modify scheduling priority of server processes. Niceness values range from -20 +(most favorable to the process) to 19 (least favorable to the process). +The default does not modify priority. +.IP \fBionice_class\fR +Modify I/O scheduling class of server processes. I/O niceness class values +are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and IOPRIO_CLASS_IDLE (idle). +The default does not modify class and priority. +Work only with ionice_priority. +.IP \fBionice_priority\fR +Modify I/O scheduling priority of server processes. I/O niceness priority +is a number which goes from 0 to 7. The higher the value, the lower +the I/O priority of the process. Work only with ionice_class. +Ignored if IOPRIO_CLASS_IDLE is set. .RE .PD @@ -155,6 +247,36 @@ and ensure that swift has read/write. The default is /var/cache/swift. 
.RE .PD +.RS 0 +.IP "\fB[filter:xprofile]\fR" +.RS 3 +.IP "\fBuse\fR" +Entry point for paste.deploy for the xprofile middleware. This is the reference to the installed python egg. +This is normally \fBegg:swift#xprofile\fR. +.IP "\fBprofile_module\fR" +This option enable you to switch profilers which should inherit from python +standard profiler. Currently the supported value can be 'cProfile', 'eventlet.green.profile' etc. +.IP "\fBlog_filename_prefix\fR" +This prefix will be used to combine process ID and timestamp to name the +profile data file. Make sure the executing user has permission to write +into this path (missing path segments will be created, if necessary). +If you enable profiling in more than one type of daemon, you must override +it with an unique value like, the default is /var/log/swift/profile/account.profile. +.IP "\fBdump_interval\fR" +The profile data will be dumped to local disk based on above naming rule +in this interval. The default is 5.0. +.IP "\fBdump_timestamp\fR" +Be careful, this option will enable profiler to dump data into the file with +time stamp which means there will be lots of files piled up in the directory. +The default is false +.IP "\fBpath\fR" +This is the path of the URL to access the mini web UI. The default is __profile__. +.IP "\fBflush_at_shutdown\fR" +Clear the data when the wsgi server shutdown. The default is false. +.IP "\fBunwind\fR" +Unwind the iterator of applications. Default is false. +.RE +.PD .SH ADDITIONAL SECTIONS @@ -173,16 +295,14 @@ Syslog log facility. The default is LOG_LOCAL0. Logging level. The default is INFO. .IP \fBlog_address\fR Logging address. The default is /dev/log. -.IP \fBvm_test_mode\fR -Indicates that you are using a VM environment. The default is no. -.IP \fBer_diff\fR -The default is 1000. +.IP \fBper_diff\fR +Maximum number of database rows that will be sync'd in a single HTTP replication request. The default is 1000. .IP \fBmax_diffs\fR This caps how long the replicator will spend trying to sync a given database per pass so the other databases don't get starved. The default is 100. .IP \fBconcurrency\fR Number of replication workers to spawn. The default is 8. .IP "\fBrun_pause [deprecated]\fR" -Time in seconds to wait between replication passes. The default is 10. +Time in seconds to wait between replication passes. The default is 30. .IP \fBinterval\fR Replaces run_pause with the more standard "interval", which means the replicator won't pause unless it takes less than the interval set. The default is 30. .IP \fBnode_timeout\fR @@ -192,6 +312,29 @@ Connection timeout to external services. The default is 0.5 seconds. .IP \fBreclaim_age\fR Time elapsed in seconds before an container can be reclaimed. The default is 604800 seconds. +.IP \fBrsync_compress\fR +Allow rsync to compress data which is transmitted to destination node +during sync. However, this is applicable only when destination node is in +a different region than the local one. The default is false. +.IP \fBrsync_module\fR +Format of the rsync module where the replicator will send data. See +etc/rsyncd.conf-sample for some usage examples. +.IP \fBrecon_cache_path\fR +Path to recon cache directory. The default is /var/cache/swift. +.IP \fBnice_priority\fR +Modify scheduling priority of server processes. Niceness values range from -20 +(most favorable to the process) to 19 (least favorable to the process). +The default does not modify priority. +.IP \fBionice_class\fR +Modify I/O scheduling class of server processes. 
I/O niceness class values +are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and IOPRIO_CLASS_IDLE (idle). +The default does not modify class and priority. +Work only with ionice_priority. +.IP \fBionice_priority\fR +Modify I/O scheduling priority of server processes. I/O niceness priority +is a number which goes from 0 to 7. The higher the value, the lower +the I/O priority of the process. Work only with ionice_class. +Ignored if IOPRIO_CLASS_IDLE is set. .RE @@ -210,15 +353,33 @@ Logging address. The default is /dev/log. .IP \fBinterval\fR Minimum time for a pass to take. The default is 300 seconds. .IP \fBconcurrency\fR -Number of reaper workers to spawn. The default is 4. +Number of updater workers to spawn. The default is 4. .IP \fBnode_timeout\fR Request timeout to external services. The default is 3 seconds. .IP \fBconn_timeout\fR Connection timeout to external services. The default is 0.5 seconds. -.IP \fBslowdown = 0.01\fR -Slowdown will sleep that amount between containers. The default is 0.01 seconds. +.IP \fBcontainers_per_second\fR +Maximum containers updated per second. Should be tuned according to individual system specs. 0 is unlimited. The default is 50. +.IP "\fBslowdown [deprecated]\fR" +Slowdown will sleep that amount between containers. The default is 0.01 seconds. Deprecated in favor of containers_per_second .IP \fBaccount_suppression_time\fR Seconds to suppress updating an account that has generated an error. The default is 60 seconds. +.IP \fBrecon_cache_path\fR +Path to recon cache directory. The default is /var/cache/swift. +.IP \fBnice_priority\fR +Modify scheduling priority of server processes. Niceness values range from -20 +(most favorable to the process) to 19 (least favorable to the process). +The default does not modify priority. +.IP \fBionice_class\fR +Modify I/O scheduling class of server processes. I/O niceness class values +are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and IOPRIO_CLASS_IDLE (idle). +The default does not modify class and priority. +Work only with ionice_priority. +.IP \fBionice_priority\fR +Modify I/O scheduling priority of server processes. I/O niceness priority +is a number which goes from 0 to 7. The higher the value, the lower +the I/O priority of the process. Work only with ionice_class. +Ignored if IOPRIO_CLASS_IDLE is set. .RE .PD @@ -237,6 +398,24 @@ Logging level. The default is INFO. Logging address. The default is /dev/log. .IP \fBinterval\fR Will audit, at most, 1 container per device per interval. The default is 1800 seconds. +.IP \fBcontainers_per_second\fR +Maximum containers audited per second. Should be tuned according to individual system specs. 0 is unlimited. The default is 200. +.IP \fBrecon_cache_path\fR +Path to recon cache directory. The default is /var/cache/swift. +.IP \fBnice_priority\fR +Modify scheduling priority of server processes. Niceness values range from -20 +(most favorable to the process) to 19 (least favorable to the process). +The default does not modify priority. +.IP \fBionice_class\fR +Modify I/O scheduling class of server processes. I/O niceness class values +are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and IOPRIO_CLASS_IDLE (idle). +The default does not modify class and priority. +Work only with ionice_priority. +.IP \fBionice_priority\fR +Modify I/O scheduling priority of server processes. I/O niceness priority +is a number which goes from 0 to 7. The higher the value, the lower +the I/O priority of the process. Work only with ionice_class. 
+Ignored if IOPRIO_CLASS_IDLE is set. .RE @@ -259,6 +438,26 @@ If you need to use an HTTP Proxy, set it here; defaults to no proxy. Will audit, at most, each container once per interval. The default is 300 seconds. .IP \fBcontainer_time\fR Maximum amount of time to spend syncing each container per pass. The default is 60 seconds. +.IP \fBconn_timeout\fR +Connection timeout to external services. The default is 5 seconds. +.IP \fBrequest_tries\fR +Server errors from requests will be retried by default. The default is 3. +.IP \fBinternal_client_conf_path\fR +Internal client config file path. +.IP \fBnice_priority\fR +Modify scheduling priority of server processes. Niceness values range from -20 +(most favorable to the process) to 19 (least favorable to the process). +The default does not modify priority. +.IP \fBionice_class\fR +Modify I/O scheduling class of server processes. I/O niceness class values +are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and IOPRIO_CLASS_IDLE (idle). +The default does not modify class and priority. +Work only with ionice_priority. +.IP \fBionice_priority\fR +Modify I/O scheduling priority of server processes. I/O niceness priority +is a number which goes from 0 to 7. The higher the value, the lower +the I/O priority of the process. Work only with ionice_class. +Ignored if IOPRIO_CLASS_IDLE is set. .RE .PD @@ -268,13 +467,11 @@ Maximum amount of time to spend syncing each container per pass. The default is .SH DOCUMENTATION .LP More in depth documentation about the swift-container-server and -also Openstack-Swift as a whole can be found at -.BI http://swift.openstack.org/admin_guide.html +also OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/admin_guide.html and -.BI http://swift.openstack.org +.BI https://docs.openstack.org/swift/latest/ .SH "SEE ALSO" -.BR swift-container-server(1), - - +.BR swift-container-server(1) diff --git a/doc/manpages/container-sync-realms.conf.5 b/doc/manpages/container-sync-realms.conf.5 new file mode 100644 index 0000000000..e96b400115 --- /dev/null +++ b/doc/manpages/container-sync-realms.conf.5 @@ -0,0 +1,138 @@ +.\" +.\" Author: HCLTech-SSW +.\" Copyright (c) 2010-2017 OpenStack Foundation. +.\" +.\" Licensed under the Apache License, Version 2.0 (the "License"); +.\" you may not use this file except in compliance with the License. +.\" You may obtain a copy of the License at +.\" +.\" http://www.apache.org/licenses/LICENSE-2.0 +.\" +.\" Unless required by applicable law or agreed to in writing, software +.\" distributed under the License is distributed on an "AS IS" BASIS, +.\" WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +.\" implied. +.\" See the License for the specific language governing permissions and +.\" limitations under the License. +.\" +.TH container-sync-realms.conf 5 "10/09/2017" "Linux" "OpenStack Swift" + +.SH NAME +.LP +.B container-sync-realms.conf +\- configuration file for the OpenStack Swift container sync realms + + + +.SH SYNOPSIS +.LP +.B container-sync-realms.conf + + + +.SH DESCRIPTION +.PP +This is the configuration file used by the Object storage Swift to perform container to container +synchronization. This configuration file is used to configure clusters to allow/accept sync +requests to/from other clusters. Using this configuration file, the user specifies where +to sync their container to along with a secret synchronization key. 
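As a rough illustration (assuming the python-swiftclient CLI and the realm/cluster names shown in the EXAMPLE section later in this manpage; the account, container and key values are placeholders), an end user would point a source container at a peer cluster and set the per-container secret roughly like this:

    swift post -t '//realm1/clustername2/AUTH_account/dest_container' -k 'usersecretkey' source_container

The container-sync daemon then sends requests to the endpoint registered for clustername2 in this file, signing each request with the realm key together with the user's per-container sync key, as described for the key options below.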
+ +You can find more information about container to container synchronization at +\fIhttps://docs.openstack.org/swift/latest/overview_container_sync.html\fR + +The configuration file follows the python-pastedeploy syntax. The file is divided +into sections, which are enclosed by square brackets. Each section will contain a +certain number of key/value parameters which are described later. + +Any line that begins with a '#' symbol is ignored. + +You can find more information about python-pastedeploy configuration format at +\fIhttps://docs.pylonsproject.org/projects/pastedeploy/en/latest/#config-format\fR + + + +.SH GLOBAL SECTION +.PD 1 +.RS 0 +This is indicated by section named [DEFAULT]. Below are the parameters that +are acceptable within this section. + +.IP "\fBmtime_check_interval\fR" +The number of seconds between checking the modified time of this config file for changes +and therefore reloading it. The default value is 300. +.RE +.PD + + + +.SH REALM SECTIONS +.PD 1 +.RS 0 +Each section name is the name of a sync realm, for example [realm1]. +A sync realm is a set of clusters that have agreed to allow container syncing with each other. +Realm names will be considered case insensitive. Below are the parameters that are acceptable +within this section. + +.IP "\fBcluster_clustername1\fR" +Any values in the realm section whose name begin with cluster_ will indicate the name and +endpoint of a cluster and will be used by external users in their container's +X-Container-Sync-To metadata header values with the format as "realm_name/cluster_name/container_name". +The Realm and cluster names are considered to be case insensitive. +.IP "\fBcluster_clustername2\fR" +Any values in the realm section whose name begin with cluster_ will indicate the name and +endpoint of a cluster and will be used by external users in their container's +X-Container-Sync-To metadata header values with the format as "realm_name/cluster_name/container_name". +The Realm and cluster names are considered to be case insensitive. + +The endpoint is what the container sync daemon will use when sending out +requests to that cluster. Keep in mind this endpoint must be reachable by all +container servers, since that is where the container sync daemon runs. Note +that the endpoint ends with /v1/ and that the container sync daemon will then +add the account/container/obj name after that. + +.IP "\fBkey\fR" +The key is the overall cluster-to-cluster key used in combination with the external +users' key that they set on their containers' X-Container-Sync-Key metadata header +values. These keys will be used to sign each request the container sync daemon makes +and used to validate each incoming container sync request. +.IP "\fBkey2\fR" +The key2 is optional and is an additional key incoming requests will be checked +against. This is so you can rotate keys if you wish; you move the existing +key to key2 and make a new key value. 
+.RE +.PD + +.SH EXAMPLE +.nf +.RS 0 +[DEFAULT] +mtime_check_interval = 300 + + +[realm1] +key = realm1key +key2 = realm1key2 +cluster_clustername1 = https://host1/v1/ +cluster_clustername2 = https://host2/v1/ + +[realm2] +key = realm2key +key2 = realm2key2 +cluster_clustername3 = https://host3/v1/ +cluster_clustername4 = https://host4/v1/ +.RE +.fi + + +.SH DOCUMENTATION +.LP +More in depth documentation in regards to +.BI swift-container-sync +and also about OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/overview_container_sync.html +and +.BI https://docs.openstack.org/swift/latest/ + + +.SH "SEE ALSO" +.BR swift-container-sync(1) diff --git a/doc/manpages/dispersion.conf.5 b/doc/manpages/dispersion.conf.5 index 8355304473..7698ee338e 100644 --- a/doc/manpages/dispersion.conf.5 +++ b/doc/manpages/dispersion.conf.5 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2010-2012 OpenStack, LLC. +.\" Copyright (c) 2010-2012 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. @@ -14,42 +14,58 @@ .\" implied. .\" See the License for the specific language governing permissions and .\" limitations under the License. -.\" +.\" .TH dispersion.conf 5 "8/26/2011" "Linux" "OpenStack Swift" -.SH NAME +.SH NAME .LP .B dispersion.conf -\- configuration file for the openstack-swift dispersion tools +\- configuration file for the OpenStack Swift dispersion tools .SH SYNOPSIS .LP .B dispersion.conf -.SH DESCRIPTION +.SH DESCRIPTION .PP This is the configuration file used by the dispersion populate and report tools. -The file format consists of the '[dispersion]' module as the header and available parameters. -Any line that begins with a '#' symbol is ignored. +The file format consists of the '[dispersion]' module as the header and available parameters. +Any line that begins with a '#' symbol is ignored. .SH PARAMETERS -.PD 1 +.PD 1 .RS 0 +.IP "\fBauth_version\fR" +Authentication system API version. The default is 1.0. .IP "\fBauth_url\fR" -Authentication system URL -.IP "\fBauth_user\fR" +Authentication system URL +.IP "\fBauth_user\fR" Authentication system account/user name .IP "\fBauth_key\fR" -Authentication system account/user password +Authentication system account/user password +.IP "\fBproject_name\fR" +Project name in case of keystone auth version 3 +.IP "\fBproject_domain_name\fR" +Project domain name in case of keystone auth version 3 +.IP "\fBuser_domain_name\fR" +User domain name in case of keystone auth version 3 +.IP "\fBendpoint_type\fR" +The default is 'publicURL'. +.IP "\fBkeystone_api_insecure\fR" +The default is false. .IP "\fBswift_dir\fR" -Location of openstack-swift configuration and ring files +Location of OpenStack Swift configuration and ring files .IP "\fBdispersion_coverage\fR" -Percentage of partition coverage to use. The default is 1. +Percentage of partition coverage to use. The default is 1.0. .IP "\fBretries\fR" -Maximum number of attempts +Maximum number of attempts. The defaul is 5. .IP "\fBconcurrency\fR" Concurrency to use. The default is 25. +.IP "\fBcontainer_populate\fR" +The default is true. +.IP "\fBobject_populate\fR" +The default is true. .IP "\fBdump_json\fR" Whether to output in json format. The default is no. .IP "\fBcontainer_report\fR" @@ -60,30 +76,34 @@ Whether to run the object report. The default is yes. 
.PD .SH SAMPLE -.PD 0 +.PD 0 .RS 0 .IP "[dispersion]" .IP "auth_url = https://127.0.0.1:443/auth/v1.0" .IP "auth_user = dpstats:dpstats" .IP "auth_key = dpstats" .IP "swift_dir = /etc/swift" -.IP "# dispersion_coverage = 1" +.IP "# keystone_api_insecure = no" +.IP "# project_name = dpstats" +.IP "# project_domain_name = default" +.IP "# user_domain_name = default" +.IP "# dispersion_coverage = 1.0" .IP "# retries = 5" .IP "# concurrency = 25" .IP "# dump_json = no" .IP "# container_report = yes" .IP "# object_report = yes" .RE -.PD +.PD + - .SH DOCUMENTATION .LP More in depth documentation about the swift-dispersion utilities and -also Openstack-Swift as a whole can be found at -.BI http://swift.openstack.org/admin_guide.html#cluster-health -and -.BI http://swift.openstack.org +also OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/admin_guide.html#dispersion-report +and +.BI https://docs.openstack.org/swift/latest/ .SH "SEE ALSO" diff --git a/doc/manpages/object-expirer.conf.5 b/doc/manpages/object-expirer.conf.5 index 8de307ee22..42ca4e0756 100644 --- a/doc/manpages/object-expirer.conf.5 +++ b/doc/manpages/object-expirer.conf.5 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2012 OpenStack, LLC. +.\" Copyright (c) 2012 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. @@ -14,13 +14,13 @@ .\" implied. .\" See the License for the specific language governing permissions and .\" limitations under the License. -.\" +.\" .TH object-expirer.conf 5 "03/15/2012" "Linux" "OpenStack Swift" -.SH NAME +.SH NAME .LP .B object-expirer.conf -\- configuration file for the openstack-swift object exprier daemon +\- configuration file for the OpenStack Swift object expirer daemon @@ -30,54 +30,100 @@ -.SH DESCRIPTION +.SH DESCRIPTION .PP -This is the configuration file used by the object expirer daemon. The daemon's -function is to query the internal hidden expiring_objects_account to discover +This is the configuration file used by the object expirer daemon. The daemon's +function is to query the internal hidden expiring_objects_account to discover objects that need to be deleted and to then delete them. The configuration file follows the python-pastedeploy syntax. The file is divided -into sections, which are enclosed by square brackets. Each section will contain a -certain number of key/value parameters which are described later. +into sections, which are enclosed by square brackets. Each section will contain a +certain number of key/value parameters which are described later. -Any line that begins with a '#' symbol is ignored. +Any line that begins with a '#' symbol is ignored. -You can find more information about python-pastedeploy configuration format at -\fIhttp://pythonpaste.org/deploy/#config-format\fR +You can find more information about python-pastedeploy configuration format at +\fIhttps://docs.pylonsproject.org/projects/pastedeploy/en/latest/#config-format\fR .SH GLOBAL SECTION -.PD 1 +.PD 1 .RS 0 -This is indicated by section named [DEFAULT]. Below are the parameters that -are acceptable within this section. +This is indicated by section named [DEFAULT]. Below are the parameters that +are acceptable within this section. -.IP \fBswift_dir\fR +.IP \fBswift_dir\fR Swift configuration directory. The default is /etc/swift. -.IP \fBuser\fR -The system user that the object server will run as. The default is swift. 
-.IP \fBlog_name\fR +.IP \fBuser\fR +The system user that the object server will run as. The default is swift. +.IP \fBlog_name\fR Label used when logging. The default is swift. -.IP \fBlog_facility\fR +.IP \fBlog_facility\fR Syslog log facility. The default is LOG_LOCAL0. -.IP \fBlog_level\fR +.IP \fBlog_level\fR Logging level. The default is INFO. .IP \fBlog_address\fR Logging address. The default is /dev/log. +.IP \fBlog_max_line_length\fR +The following caps the length of log lines to the value given; no limit if +set to 0, the default. +.IP \fBlog_custom_handlers\fR +Comma separated list of functions to call to setup custom log handlers. +functions get passed: conf, name, log_to_console, log_route, fmt, logger, +adapted_logger. The default is empty. +.IP \fBlog_udp_host\fR +If set, log_udp_host will override log_address. +.IP "\fBlog_udp_port\fR +UDP log port, the default is 514. +.IP \fBlog_statsd_host\fR +StatsD server. IPv4/IPv6 addresses and hostnames are +supported. If a hostname resolves to an IPv4 and IPv6 address, the IPv4 +address will be used. +.IP \fBlog_statsd_port\fR +The default is 8125. +.IP \fBlog_statsd_default_sample_rate\fR +The default is 1. +.IP \fBlog_statsd_sample_rate_factor\fR +The default is 1. +.IP \fBlog_statsd_metric_prefix\fR +The default is empty. +.IP \fBdelay_reaping_account/container\fR +Normally, the expirer begins reaping expired objects immediately. You can add +options prefixed with "delay_reaping_" in the form of +"delay_reaping_[/]" to cause the expirer to delay processing of +tasks in those account or account/container. The [/] part of the +config option names should url-quote the paths. The value is in seconds. The +default is no delay for any tasks. +.IP \fBround_robin_task_cache_size\fR +Number of tasks objects to cache before processing. +.IP \fBnice_priority\fR +Modify scheduling priority of server processes. Niceness values range from -20 +(most favorable to the process) to 19 (least favorable to the process). +The default does not modify priority. +.IP \fBionice_class\fR +Modify I/O scheduling class of server processes. I/O niceness class values +are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and IOPRIO_CLASS_IDLE (idle). +The default does not modify class and priority. +Work only with ionice_priority. +.IP \fBionice_priority\fR +Modify I/O scheduling priority of server processes. I/O niceness priority +is a number which goes from 0 to 7. The higher the value, the lower +the I/O priority of the process. Work only with ionice_class. +Ignored if IOPRIO_CLASS_IDLE is set. .RE .PD .SH PIPELINE SECTION -.PD 1 +.PD 1 .RS 0 This is indicated by section name [pipeline:main]. Below are the parameters that -are acceptable within this section. +are acceptable within this section. .IP "\fBpipeline\fR" -It is used when you need to apply a number of filters. It is a list of filters +It is used when you need to apply a number of filters. It is a list of filters ended by an application. The default should be \fB"catch_errors cache proxy-server"\fR .RE .PD @@ -85,24 +131,38 @@ ended by an application. The default should be \fB"catch_errors cache proxy-serv .SH APP SECTION -.PD 1 +.PD 1 .RS 0 This is indicated by section name [app:object-server]. Below are the parameters that are acceptable within this section. .IP "\fBuse\fR" -Entry point for paste.deploy for the object server. This is the reference to the installed python egg. -The default is \fBegg:swift#proxy\fR. See proxy-server.conf-sample for options or See proxy-server.conf manpage. 
+Entry point for paste.deploy for the object server. This is the reference to the installed python egg. +The default is \fBegg:swift#proxy\fR. See proxy-server.conf-sample for options or See proxy-server.conf manpage. +.IP \fBnice_priority\fR +Modify scheduling priority of server processes. Niceness values range from -20 +(most favorable to the process) to 19 (least favorable to the process). +The default does not modify priority. +.IP \fBionice_class\fR +Modify I/O scheduling class of server processes. I/O niceness class values +are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and IOPRIO_CLASS_IDLE (idle). +The default does not modify class and priority. +Work only with ionice_priority. +.IP \fBionice_priority\fR +Modify I/O scheduling priority of server processes. I/O niceness priority +is a number which goes from 0 to 7. The higher the value, the lower +the I/O priority of the process. Work only with ionice_class. +Ignored if IOPRIO_CLASS_IDLE is set. .RE .PD .SH FILTER SECTION -.PD 1 +.PD 1 .RS 0 Any section that has its name prefixed by "filter:" indicates a filter section. Filters are used to specify configuration parameters for specific swift middlewares. -Below are the filters available and respective acceptable parameters. +Below are the filters available and respective acceptable parameters. .RS 0 .IP "\fB[filter:cache]\fR" @@ -117,8 +177,8 @@ The default is \fBegg:swift#memcache\fR. See proxy-server.conf-sample for option .RE -.RS 0 -.IP "\fB[filter:catch_errors]\fR" +.RS 0 +.IP "\fB[filter:catch_errors]\fR" .RE .RS 3 .IP \fBuse\fR @@ -126,17 +186,79 @@ Entry point for paste.deploy for the catch_errors middleware. This is the refere The default is \fBegg:swift#catch_errors\fR. See proxy-server.conf-sample for options or See proxy-server.conf manpage. .RE +.RS 0 +.IP "\fB[filter:proxy-logging]\fR" +.RE + +Logging for the proxy server now lives in this middleware. +If the access_* variables are not set, logging directives from [DEFAULT] +without "access_" will be used. + +.RS 3 +.IP \fBuse\fR +Entry point for paste.deploy for the proxy_logging middleware. This is the reference to the installed python egg. +This is normally \fBegg:swift#proxy_logging\fR. See proxy-server.conf-sample for options or See proxy-server.conf manpage. +.RE + .PD +.SH OBJECT EXPIRER SECTION +.PD 1 +.RS 0 +.IP "\fB[object-expirer]\fR" +.RE +.RS 3 +.IP \fBinterval\fR +Replaces run_pause with the more standard "interval", which means the replicator won't pause unless it takes less than the interval set. The default is 300. +.IP \fBreport_interval\fR +The default is 300 seconds. +.IP \fBrequest_tries\fR +The number of times the expirer's internal client will +attempt any given request in the event of failure. The default is 3. +.IP \fBconcurrency\fR +Number of expirer workers to spawn. The default is 1. +.IP \fBprocesses\fR +Processes is how many parts to divide the work into, one part per process that will be doing the work. +Processes set 0 means that a single process will be doing all the work. +Processes can also be specified on the command line and will override the config value. +The default is 0. +.IP \fBprocess\fR +Process is which of the parts a particular process will work on process can also be specified +on the command line and will override the config value process is "zero based", if you want +to use 3 processes, you should run processes with process set to 0, 1, and 2. The default is 0. 
+.IP \fBreclaim_age\fR +The expirer will re-attempt expiring if the source object is not available +up to reclaim_age seconds before it gives up and deletes the entry in the +queue. The default is 604800 seconds. +.IP \fBrecon_cache_path\fR +Path to recon cache directory. The default is /var/cache/swift. +.IP \fBnice_priority\fR +Modify scheduling priority of server processes. Niceness values range from -20 +(most favorable to the process) to 19 (least favorable to the process). +The default does not modify priority. +.IP \fBionice_class\fR +Modify I/O scheduling class of server processes. I/O niceness class values +are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and IOPRIO_CLASS_IDLE (idle). +The default does not modify class and priority. +Work only with ionice_priority. +.IP \fBionice_priority\fR +Modify I/O scheduling priority of server processes. I/O niceness priority +is a number which goes from 0 to 7. The higher the value, the lower +the I/O priority of the process. Work only with ionice_class. +Ignored if IOPRIO_CLASS_IDLE is set. + +.RE +.PD + .SH DOCUMENTATION .LP More in depth documentation about the swift-object-expirer and -also Openstack-Swift as a whole can be found at -.BI http://swift.openstack.org/admin_guide.html -and -.BI http://swift.openstack.org +also OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/admin_guide.html +and +.BI https://docs.openstack.org/swift/latest/ .SH "SEE ALSO" diff --git a/doc/manpages/object-server.conf.5 b/doc/manpages/object-server.conf.5 index 4087cde138..a8c743e6d4 100644 --- a/doc/manpages/object-server.conf.5 +++ b/doc/manpages/object-server.conf.5 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2010-2012 OpenStack, LLC. +.\" Copyright (c) 2010-2012 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. @@ -20,7 +20,7 @@ .SH NAME .LP .B object-server.conf -\- configuration file for the openstack-swift object server +\- configuration file for the OpenStack Swift object server @@ -33,7 +33,8 @@ .SH DESCRIPTION .PP This is the configuration file used by the object server and other object -background services, such as; replicator, updater and auditor. +background services, such as; replicator, reconstructor, updater, auditor, and +expirer. The configuration file follows the python-pastedeploy syntax. The file is divided into sections, which are enclosed by square brackets. Each section will contain a @@ -42,7 +43,7 @@ certain number of key/value parameters which are described later. Any line that begins with a '#' symbol is ignored. You can find more information about python-pastedeploy configuration format at -\fIhttp://pythonpaste.org/deploy/#config-format\fR +\fIhttps://docs.pylonsproject.org/projects/pastedeploy/en/latest/#config-format\fR @@ -56,20 +57,39 @@ are acceptable within this section. IP address the object server should bind to. The default is 0.0.0.0 which will make it bind to all available addresses. .IP "\fBbind_port\fR" -TCP port the object server should bind to. The default is 6000. +TCP port the object server should bind to. The default is 6200. +.IP "\fBkeep_idle\fR" +Value to set for socket TCP_KEEPIDLE. The default value is 600. +.IP "\fBbind_timeout\fR" +Timeout to bind socket. The default is 30. .IP \fBbacklog\fR TCP backlog. Maximum number of allowed pending connections. The default value is 4096. 
.IP \fBworkers\fR -Number of object server workers to fork. The default is 1. +The number of pre-forked processes that will accept connections. Zero means +no fork. The default is auto which will make the server try to match the +number of effective cpu cores if python multiprocessing is available (included +with most python distributions >= 2.6) or fallback to one. It's worth noting +that individual workers will use many eventlet co-routines to service multiple +concurrent requests. +.IP \fBmax_clients\fR +Maximum number of clients one worker can process simultaneously (it will +actually accept(2) N + 1). Setting this to one (1) will only handle one request +at a time, without accepting another request concurrently. The default is 1024. .IP \fBuser\fR The system user that the object server will run as. The default is swift. .IP \fBswift_dir\fR Swift configuration directory. The default is /etc/swift. .IP \fBdevices\fR -Parent directory or where devices are mounted. Default is /srv/node. +Parent directory of where devices are mounted. Default is /srv/node. .IP \fBmount_check\fR Whether or not check if the devices are mounted to prevent accidentally writing to the root device. The default is set to true. +.IP \fBdisable_fallocate\fR +Disable pre-allocate disk space for a file. The default is false. +.IP \fBservers_per_port\fR +Make object-server run this many worker processes per unique port of "local" +ring devices across all storage policies. The default value of 0 disables this +feature. .IP \fBlog_name\fR Label used when logging. The default is swift. .IP \fBlog_facility\fR @@ -78,6 +98,70 @@ Syslog log facility. The default is LOG_LOCAL0. Logging level. The default is INFO. .IP \fBlog_address\fR Logging address. The default is /dev/log. +.IP \fBlog_max_line_length\fR +The following caps the length of log lines to the value given; no limit if +set to 0, the default. +.IP \fBlog_custom_handlers\fR +Comma separated list of functions to call to setup custom log handlers. +functions get passed: conf, name, log_to_console, log_route, fmt, logger, +adapted_logger. The default is empty. +.IP \fBlog_udp_host\fR +If set, log_udp_host will override log_address. +.IP "\fBlog_udp_port\fR +UDP log port, the default is 514. +.IP \fBlog_statsd_host\fR +StatsD server. IPv4/IPv6 addresses and hostnames are +supported. If a hostname resolves to an IPv4 and IPv6 address, the IPv4 +address will be used. +.IP \fBlog_statsd_port\fR +The default is 8125. +.IP \fBlog_statsd_default_sample_rate\fR +The default is 1. +.IP \fBlog_statsd_sample_rate_factor\fR +The default is 1. +.IP \fBlog_statsd_metric_prefix\fR +The default is empty. +.IP \fBeventlet_debug\fR +Debug mode for eventlet library. The default is false. +.IP \fBfallocate_reserve\fR +You can set fallocate_reserve to the number of bytes or percentage of disk +space you'd like fallocate to reserve, whether there is space for the given +file size or not. Percentage will be used if the value ends with a '%'. +The default is 1%. +.IP \fBnode_timeout\fR +Request timeout to external services. The default is 3 seconds. +.IP \fBconn_timeout\fR +Connection timeout to external services. The default is 0.5 seconds. +.IP \fBcontainer_update_timeout\fR +Time to wait while sending a container update on object update. The default is 1 second. +.IP \fBclient_timeout\fR +Time to wait while receiving each chunk of data from a client or another +backend node. The default is 60. +.IP \fBnetwork_chunk_size\fR +The default is 65536. 
+.IP \fBdisk_chunk_size\fR +The default is 65536. +.IP \fBreclaim_age\fR +Time elapsed in seconds before an object can be reclaimed. The default is +604800 seconds. +.IP \fBcommit_window\fR +Time in seconds during which a newly written non-durable data file will not be +reclaimed. The value should be greater than zero and much less than +reclaim_age. The default is 60.0 seconds. +.IP \fBnice_priority\fR +Modify scheduling priority of server processes. Niceness values range from -20 +(most favorable to the process) to 19 (least favorable to the process). +The default does not modify priority. +.IP \fBionice_class\fR +Modify I/O scheduling class of server processes. I/O niceness class values +are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and IOPRIO_CLASS_IDLE (idle). +The default does not modify class and priority. +Work only with ionice_priority. +.IP \fBionice_priority\fR +Modify I/O scheduling priority of server processes. I/O niceness priority +is a number which goes from 0 to 7. The higher the value, the lower +the I/O priority of the process. Work only with ionice_class. +Ignored if IOPRIO_CLASS_IDLE is set. .RE .PD @@ -106,20 +190,85 @@ that are acceptable within this section. .IP "\fBuse\fR" Entry point for paste.deploy for the object server. This is the reference to the installed python egg. This is normally \fBegg:swift#object\fR. -.IP "\fBset log_name\fR +.IP "\fBset log_name\fR" Label used when logging. The default is object-server. -.IP "\fBset log_facility\fR +.IP "\fBset log_facility\fR" Syslog log facility. The default is LOG_LOCAL0. -.IP "\fB set log_level\fR +.IP "\fBset log_level\fR" Logging level. The default is INFO. -.IP "\fB set log_requests\fR +.IP "\fBset log_requests\fR" Enables request logging. The default is True. -.IP "\fB set log_address\fR +.IP "\fBset log_address\fR" Logging address. The default is /dev/log. +.IP "\fBmax_upload_time\fR" +The default is 86400. +.IP "\fBslow\fR" +The default is 0. +.IP "\fBkeep_cache_size\fR" +Objects smaller than this are not evicted from the buffercache once read. The default is 5242880. +.IP "\fBkeep_cache_private\fR" +If true, objects for authenticated GET requests may be kept in buffer cache +if small enough. The default is false. +.IP "\fBmb_per_sync\fR" +On PUTs, sync data every n MB. The default is 512. +.IP "\fBallowed_headers\fR" +Comma separated list of headers that can be set in metadata on an object. +This list is in addition to X-Object-Meta-* headers and cannot include Content-Type, etag, Content-Length, or deleted. +The default is 'Content-Disposition, Content-Encoding, X-Delete-At, X-Object-Manifest, X-Static-Large-Object, Cache-Control, Content-Language, Expires, X-Robots-Tag'. +.IP "\fBreplication_server\fR" +Configure parameter for creating specific server +To handle all verbs, including replication verbs, do not specify +"replication_server" (this is the default). To only handle replication, +set to a True value (e.g. "True" or "1"). To handle only non-replication +verbs, set to "False". Unless you have a separate replication network, you +should not specify any value for "replication_server". +.IP "\fBreplication_concurrency\fR" +Set to restrict the number of concurrent incoming SSYNC requests +Set to 0 for unlimited (the default is 4). Note that SSYNC requests are only used +by the object reconstructor or the object replicator when configured to use ssync. 
+.IP "\fBreplication_concurrency_per_device\fR" +Set to restrict the number of concurrent incoming SSYNC requests per device; +set to 0 for unlimited requests per devices. This can help control I/O to each +device. This does not override replication_concurrency described above, so you +may need to adjust both parameters depending on your hardware or network +capacity. Defaults to 1. +.IP "\fBreplication_lock_timeout\fR" +Number of seconds to wait for an existing replication device lock before +giving up. The default is 15. +.IP "\fBreplication_failure_threshold\fR" +.IP "\fBreplication_failure_ratio\fR" +These two settings control when the SSYNC subrequest handler will +abort an incoming SSYNC attempt. An abort will occur if there are at +least threshold number of failures and the value of failures / successes +exceeds the ratio. The defaults of 100 and 1.0 means that at least 100 +failures have to occur and there have to be more failures than successes for +an abort to occur. +.IP "\fBsplice\fR" +Use splice() for zero-copy object GETs. This requires Linux kernel +version 3.0 or greater. If you set "splice = yes" but the kernel +does not support it, error messages will appear in the object server +logs at startup, but your object servers should continue to function. +The default is false. .IP \fBnode_timeout\fR Request timeout to external services. The default is 3 seconds. .IP \fBconn_timeout\fR Connection timeout to external services. The default is 0.5 seconds. +.IP \fBcontainer_update_timeout\fR +Time to wait while sending a container update on object update. The default is 1 second. +.IP \fBnice_priority\fR +Modify scheduling priority of server processes. Niceness values range from -20 +(most favorable to the process) to 19 (least favorable to the process). +The default does not modify priority. +.IP \fBionice_class\fR +Modify I/O scheduling class of server processes. I/O niceness class values +are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and IOPRIO_CLASS_IDLE (idle). +The default does not modify class and priority. +Work only with ionice_priority. +.IP \fBionice_priority\fR +Modify I/O scheduling priority of server processes. I/O niceness priority +is a number which goes from 0 to 7. The higher the value, the lower +the I/O priority of the process. Work only with ionice_class. +Ignored if IOPRIO_CLASS_IDLE is set. .RE .PD @@ -153,9 +302,41 @@ This is normally \fBegg:swift#recon\fR. The recon_cache_path simply sets the directory where stats for a few items will be stored. Depending on the method of deployment you may need to create this directory manually and ensure that swift has read/write. The default is /var/cache/swift. +.IP "\fBrecon_lock_path\fR" +The default is /var/lock. .RE .PD +.RS 0 +.IP "\fB[filter:xprofile]\fR" +.RS 3 +.IP "\fBuse\fR" +Entry point for paste.deploy for the xprofile middleware. This is the reference to the installed python egg. +This is normally \fBegg:swift#xprofile\fR. +.IP "\fBprofile_module\fR" +This option enable you to switch profilers which should inherit from python +standard profiler. Currently the supported value can be 'cProfile', 'eventlet.green.profile' etc. +.IP "\fBlog_filename_prefix\fR" +This prefix will be used to combine process ID and timestamp to name the +profile data file. Make sure the executing user has permission to write +into this path (missing path segments will be created, if necessary). 
+If you enable profiling in more than one type of daemon, you must override +it with an unique value like, the default is /var/log/swift/profile/account.profile. +.IP "\fBdump_interval\fR" +The profile data will be dumped to local disk based on above naming rule +in this interval. The default is 5.0. +.IP "\fBdump_timestamp\fR" +Be careful, this option will enable profiler to dump data into the file with +time stamp which means there will be lots of files piled up in the directory. +The default is false +.IP "\fBpath\fR" +This is the path of the URL to access the mini web UI. The default is __profile__. +.IP "\fBflush_at_shutdown\fR" +Clear the data when the wsgi server shutdown. The default is false. +.IP "\fBunwind\fR" +Unwind the iterator of applications. Default is false. +.RE +.PD .SH ADDITIONAL SECTIONS @@ -174,35 +355,130 @@ Syslog log facility. The default is LOG_LOCAL0. Logging level. The default is INFO. .IP \fBlog_address\fR Logging address. The default is /dev/log. -.IP \fBvm_test_mode\fR -Indicates that you are using a VM environment. The default is no. .IP \fBdaemonize\fR Whether or not to run replication as a daemon. The default is yes. -.IP \fBrun_pause\fR +.IP "\fBrun_pause [deprecated]\fR" +Time in seconds to wait between replication passes. The default is 30. +.IP \fBinterval\fR Time in seconds to wait between replication passes. The default is 30. .IP \fBconcurrency\fR Number of replication workers to spawn. The default is 1. .IP \fBstats_interval\fR Interval in seconds between logging replication statistics. The default is 300. +.IP \fBsync_method\fR +The sync method to use; default is rsync but you can use ssync to try the +EXPERIMENTAL all-swift-code-no-rsync-callouts method. Once ssync is verified +as having performance comparable to, or better than, rsync, we plan to +deprecate rsync so we can move on with more features for replication. .IP \fBrsync_timeout\fR Max duration of a partition rsync. The default is 900 seconds. .IP \fBrsync_io_timeout\fR Passed to rsync for I/O OP timeout. The default is 30 seconds. +.IP \fBrsync_compress\fR +Allow rsync to compress data which is transmitted to destination node +during sync. However, this is applicable only when destination node is in +a different region than the local one. +NOTE: Objects that are already compressed (for example: .tar.gz, .mp3) might +slow down the syncing process. The default is false. +.IP \fBrsync_module\fR +Format of the rsync module where the replicator will send data. See +etc/rsyncd.conf-sample for some usage examples. The default is empty. +.IP \fBnode_timeout\fR +Request timeout to external services. The default is 10 seconds. +.IP \fBrsync_bwlimit\fR +Passed to rsync for bandwidth limit in kB/s. The default is 0 (unlimited). .IP \fBhttp_timeout\fR Max duration of an HTTP request. The default is 60 seconds. .IP \fBlockup_timeout\fR Attempts to kill all workers if nothing replicates for lockup_timeout seconds. The default is 1800 seconds. -.IP \fBreclaim_age\fR -Time elapsed in seconds before an object can be reclaimed. The default is -604800 seconds. -.IP \fBrecon_enable\fR -Enable logging of replication stats for recon. The default is on. +.IP \fBring_check_interval\fR +The default is 15. +.IP \fBrsync_error_log_line_length\fR +Limits how long rsync error log lines are. 0 (default) means to log the entire line. +.IP "\fBrecon_cache_path\fR" +The recon_cache_path simply sets the directory where stats for a few items will be stored. 
+Depending on the method of deployment you may need to create this directory manually +and ensure that swift has read/write.The default is /var/cache/swift. +.IP "\fBhandoffs_first\fR" +The flag to replicate handoffs prior to canonical partitions. +It allows one to force syncing and deleting handoffs quickly. +If set to a True value(e.g. "True" or "1"), partitions +that are not supposed to be on the node will be replicated first. +The default is false. +.IP "\fBhandoff_delete\fR" +The number of replicas which are ensured in swift. +If the number less than the number of replicas is set, object-replicator +could delete local handoffs even if all replicas are not ensured in the +cluster. Object-replicator would remove local handoff partition directories +after syncing partition when the number of successful responses is greater +than or equal to this number. By default(auto), handoff partitions will be +removed when it has successfully replicated to all the canonical nodes. + +The handoffs_first and handoff_delete are options for a special case +such as disk full in the cluster. These two options SHOULD NOT BE +CHANGED, except for such an extreme situations. (e.g. disks filled up +or are about to fill up. Anyway, DO NOT let your drives fill up). +.IP \fBnice_priority\fR +Modify scheduling priority of server processes. Niceness values range from -20 +(most favorable to the process) to 19 (least favorable to the process). +The default does not modify priority. +.IP \fBionice_class\fR +Modify I/O scheduling class of server processes. I/O niceness class values +are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and IOPRIO_CLASS_IDLE (idle). +The default does not modify class and priority. +Work only with ionice_priority. +.IP \fBionice_priority\fR +Modify I/O scheduling priority of server processes. I/O niceness priority +is a number which goes from 0 to 7. The higher the value, the lower +the I/O priority of the process. Work only with ionice_class. +Ignored if IOPRIO_CLASS_IDLE is set. +.RE + + +.RS 0 +.IP "\fB[object-reconstructor]\fR" +.RE +.RS 3 +.IP \fBlog_name\fR +Label used when logging. The default is object-reconstructor. +.IP \fBlog_facility\fR +Syslog log facility. The default is LOG_LOCAL0. +.IP \fBlog_level\fR +Logging level. The default is INFO. +.IP \fBlog_address\fR +Logging address. The default is /dev/log. +.IP \fBdaemonize\fR +Whether or not to run replication as a daemon. The default is yes. +.IP "\fBrun_pause [deprecated]\fR" +Time in seconds to wait between replication passes. The default is 30. +.IP \fBinterval\fR +Time in seconds to wait between replication passes. The default is 30. +.IP \fBconcurrency\fR +Number of replication workers to spawn. The default is 1. +.IP \fBstats_interval\fR +Interval in seconds between logging replication statistics. The default is 300. +.IP \fBnode_timeout\fR +Request timeout to external services. The default is 10 seconds. +.IP \fBhttp_timeout\fR +Max duration of an HTTP request. The default is 60 seconds. +.IP \fBlockup_timeout\fR +Attempts to kill all workers if nothing replicates for lockup_timeout seconds. The +default is 1800 seconds. +.IP \fBring_check_interval\fR +The default is 15. .IP "\fBrecon_cache_path\fR" The recon_cache_path simply sets the directory where stats for a few items will be stored. Depending on the method of deployment you may need to create this directory manually and ensure that swift has read/write.The default is /var/cache/swift. 
+.IP "\fBhandoffs_first\fR" +The flag to replicate handoffs prior to canonical partitions. +It allows one to force syncing and deleting handoffs quickly. +If set to a True value(e.g. "True" or "1"), partitions +that are not supposed to be on the node will be replicated first. +The default is false. .RE +.PD .RS 0 @@ -220,13 +496,31 @@ Logging address. The default is /dev/log. .IP \fBinterval\fR Minimum time for a pass to take. The default is 300 seconds. .IP \fBconcurrency\fR -Number of reaper workers to spawn. The default is 1. +Number of updater workers to spawn. The default is 1. .IP \fBnode_timeout\fR Request timeout to external services. The default is 10 seconds. -.IP \fBconn_timeout\fR -Connection timeout to external services. The default is 0.5 seconds. -.IP \fBslowdown = 0.01\fR -Slowdown will sleep that amount between objects. The default is 0.01 seconds. +.IP \fBobjects_per_second\fR +Maximum objects updated per second. Should be tuned according to individual system specs. 0 is unlimited. The default is 50. +.IP "\fBslowdown [deprecated]\fR" +Slowdown will sleep that amount between objects. The default is 0.01 seconds. Deprecated in favor of objects_per_second. +.IP "\fBrecon_cache_path\fR" +The recon_cache_path simply sets the directory where stats for a few items will be stored. +Depending on the method of deployment you may need to create this directory manually +and ensure that swift has read/write. The default is /var/cache/swift. +.IP \fBnice_priority\fR +Modify scheduling priority of server processes. Niceness values range from -20 +(most favorable to the process) to 19 (least favorable to the process). +The default does not modify priority. +.IP \fBionice_class\fR +Modify I/O scheduling class of server processes. I/O niceness class values +are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and IOPRIO_CLASS_IDLE (idle). +The default does not modify class and priority. +Work only with ionice_priority. +.IP \fBionice_priority\fR +Modify I/O scheduling priority of server processes. I/O niceness priority +is a number which goes from 0 to 7. The higher the value, the lower +the I/O priority of the process. Work only with ionice_class. +Ignored if IOPRIO_CLASS_IDLE is set. .RE .PD @@ -244,31 +538,125 @@ Logging level. The default is INFO. .IP \fBlog_address\fR Logging address. The default is /dev/log. +.IP \fBdisk_chunk_size\fR +The default is 65536. .IP \fBfiles_per_second\fR Maximum files audited per second. Should be tuned according to individual system specs. 0 is unlimited. The default is 20. .IP \fBbytes_per_second\fR Maximum bytes audited per second. Should be tuned according to individual system specs. 0 is unlimited. The default is 10000000. +.IP \fBconcurrency\fR +Number of auditor workers to spawn. The default is 1. .IP \fBlog_time\fR The default is 3600 seconds. .IP \fBzero_byte_files_per_second\fR The default is 50. +.IP "\fBrecon_cache_path\fR" +The recon_cache_path simply sets the directory where stats for a few items will be stored. +Depending on the method of deployment you may need to create this directory manually +and ensure that swift has read/write. The default is /var/cache/swift. +.IP \fBobject_size_stats\fR +Takes a comma separated list of ints. If set, the object auditor will +increment a counter for every object whose size is <= to the given break +points and report the result after a full scan. +.IP \fBrsync_tempfile_timeout\fR +Time elapsed in seconds before rsync tempfiles will be unlinked. 
Config value of "auto" +will try to use object-replicator's rsync_timeout + 900 or fall-back to 86400 (1 day). +.IP \fBnice_priority\fR +Modify scheduling priority of server processes. Niceness values range from -20 +(most favorable to the process) to 19 (least favorable to the process). +The default does not modify priority. +.IP \fBionice_class\fR +Modify I/O scheduling class of server processes. I/O niceness class values +are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and IOPRIO_CLASS_IDLE (idle). +The default does not modify class and priority. +Work only with ionice_priority. +.IP \fBionice_priority\fR +Modify I/O scheduling priority of server processes. I/O niceness priority +is a number which goes from 0 to 7. The higher the value, the lower +the I/O priority of the process. Work only with ionice_class. +Ignored if IOPRIO_CLASS_IDLE is set. .RE +.RS 0 +.IP "\fB[object-expirer]\fR" +.RE +.RS 3 +.IP \fBlog_name\fR +Label used when logging. The default is object-expirer. +.IP \fBlog_facility\fR +Syslog log facility. The default is LOG_LOCAL0. +.IP \fBlog_level\fR +Logging level. The default is INFO. +.IP \fBlog_address\fR +Logging address. The default is /dev/log. +.IP \fBinterval\fR +Minimum time for a pass to take. The default is 300 seconds. +.IP \fBreport_interval\fR +Minimum time for a pass to report. The default is 300 seconds. +.IP \fBrequest_tries\fR +The number of times the expirer's internal client will +attempt any given request in the event of failure. The default is 3. +.IP \fBconcurrency\fR +Number of expirer workers to spawn. The default is 1. +.IP \fBdequeue_from_legacy\fR +The flag to execute legacy style expirer tasks. The default is false. +.IP \fBprocesses\fR +Processes can only be used in conjunction with `dequeue_from_legacy`. +Processes is how many parts to divide the legacy work into, one part per process that will be doing the work. +Processes set 0 means that a single process will be doing all the legacy work. +Processes can also be specified on the command line and will override the config value. +The default is 0. +.IP \fBprocess\fR +Process can only be used in conjunction with `dequeue_from_legacy`. +Process is which of the parts a particular legacy process will work on process can also be specified +on the command line and will override the config value process is "zero based", if you want +to use 3 processes, you should run processes with process set to 0, 1, and 2. The default is 0. +.IP \fBreclaim_age\fR +The expirer will re-attempt expiring if the source object is not available up +to reclaim_age seconds before it gives up and deletes the task in the queue. +The default is 604800 seconds (= 1 week). +.IP \fBdelay_reaping_account/container\fR +Normally, the expirer begins reaping expired objects immediately. You can add +options prefixed with "delay_reaping_" in the form of +"delay_reaping_[/]" to cause the expirer to delay processing of +tasks in those account or account/container. The [/] part of the +config option names should url-quote the paths. The value is in seconds. The +default is no delay for any tasks. +.IP \fBround_robin_task_cache_size\fR +Number of tasks objects to cache before processing. +.IP \fBrecon_cache_path\fR +Path to recon cache directory. The default is /var/cache/swift +.IP \fBnice_priority\fR +Modify scheduling priority of server processes. Niceness values range from -20 +(most favorable to the process) to 19 (least favorable to the process). +The default does not modify priority. 
+.IP \fBionice_class\fR +Modify I/O scheduling class of server processes. I/O niceness class values +are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and IOPRIO_CLASS_IDLE (idle). +The default does not modify class and priority. +Work only with ionice_priority. +.IP \fBionice_priority\fR +Modify I/O scheduling priority of server processes. I/O niceness priority +is a number which goes from 0 to 7. The higher the value, the lower +the I/O priority of the process. Work only with ionice_class. +Ignored if IOPRIO_CLASS_IDLE is set. +.RE +.PD + + .SH DOCUMENTATION .LP More in depth documentation about the swift-object-server and -also Openstack-Swift as a whole can be found at -.BI http://swift.openstack.org/admin_guide.html +also OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/admin_guide.html and -.BI http://swift.openstack.org +.BI https://docs.openstack.org/swift/latest/ .SH "SEE ALSO" .BR swift-object-server(1), - - diff --git a/doc/manpages/proxy-server.conf.5 b/doc/manpages/proxy-server.conf.5 index 2d077e0e45..6fe7c93163 100644 --- a/doc/manpages/proxy-server.conf.5 +++ b/doc/manpages/proxy-server.conf.5 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2010-2012 OpenStack, LLC. +.\" Copyright (c) 2010-2012 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. @@ -20,7 +20,7 @@ .SH NAME .LP .B proxy-server.conf -\- configuration file for the openstack-swift proxy server +\- configuration file for the OpenStack Swift proxy server @@ -41,7 +41,7 @@ certain number of key/value parameters which are described later. Any line that begins with a '#' symbol is ignored. You can find more information about python-pastedeploy configuration format at -\fIhttp://pythonpaste.org/deploy/#config-format\fR +\fIhttps://docs.pylonsproject.org/projects/pastedeploy/en/latest/#config-format\fR @@ -56,12 +56,38 @@ IP address the proxy server should bind to. The default is 0.0.0.0 which will ma it bind to all available addresses. .IP "\fBbind_port\fR" TCP port the proxy server should bind to. The default is 80. +.IP "\fBkeep_idle\fR" +Value to set for socket TCP_KEEPIDLE. The default value is 600. +.IP "\fBbind_timeout\fR" +Timeout to bind socket. The default is 30. .IP \fBbacklog\fR TCP backlog. Maximum number of allowed pending connections. The default value is 4096. +.IP \fBadmin_key\fR +Key to use for admin calls that are HMAC signed. Default is empty, +which will disable admin calls to /info. +.IP \fBdisallowed_sections\fR +Allows the ability to withhold sections from showing up in the public calls +to /info. You can withhold subsections by separating the dict level with a +".". The following would cause the sections 'container_quotas' and 'tempurl' +to not be listed, and the key max_failed_deletes would be removed from +bulk_delete. Default value is 'swift.valid_api_versions' which allows all +registered features to be listed via HTTP GET /info except +swift.valid_api_versions information .IP \fBworkers\fR -Number of container server workers to fork. The default is 1. +The number of pre-forked processes that will accept connections. Zero means +no fork. The default is auto which will make the server try to match the +number of effective cpu cores if python multiprocessing is available (included +with most python distributions >= 2.6) or fallback to one. 
It's worth noting +that individual workers will use many eventlet co-routines to service multiple +concurrent requests. +.IP \fBmax_clients\fR +Maximum number of clients one worker can process simultaneously (it will +actually accept(2) N + 1). Setting this to one (1) will only handle one request +at a time, without accepting another request concurrently. The default is 1024. .IP \fBuser\fR -The system user that the container server will run as. The default is swift. +The system user that the proxy server will run as. The default is swift. +.IP \fBexpose_info\fR +Enables exposing configuration settings via HTTP GET /info. The default is true. .IP \fBswift_dir\fR Swift configuration directory. The default is /etc/swift. .IP \fBcert_file\fR @@ -78,6 +104,62 @@ Syslog log facility. The default is LOG_LOCAL0. Logging level. The default is INFO. .IP \fBlog_address\fR Logging address. The default is /dev/log. +.IP \fBlog_max_line_length\fR +To cap the length of log lines to the value given. No limit if set to 0, the default. +.IP \fBlog_headers\fR +The default is false. +.IP \fBlog_custom_handlers\fR +Comma separated list of functions to call to setup custom log handlers. +functions get passed: conf, name, log_to_console, log_route, fmt, logger, +adapted_logger. The default is empty. +.IP \fBlog_udp_host\fR +If set, log_udp_host will override log_address. +.IP "\fBlog_udp_port\fR +UDP log port, the default is 514. +.IP \fBlog_statsd_host\fR +StatsD server. IPv4/IPv6 addresses and hostnames are +supported. If a hostname resolves to an IPv4 and IPv6 address, the IPv4 +address will be used. +.IP \fBlog_statsd_port\fR +The default is 8125. +.IP \fBlog_statsd_default_sample_rate\fR +The default is 1. +.IP \fBlog_statsd_sample_rate_factor\fR +The default is 1. +.IP \fBlog_statsd_metric_prefix\fR +The default is empty. +.IP \fBclient_timeout\fR +Time to wait while receiving each chunk of data from a client or another +backend node. The default is 60. +.IP \fBeventlet_debug\fR +Debug mode for eventlet library. The default is false. +.IP \fBtrans_id_suffix\fR +This optional suffix (default is empty) that would be appended to the swift transaction +id allows one to easily figure out from which cluster that X-Trans-Id belongs to. +This is very useful when one is managing more than one swift cluster. +.IP \fBcors_allow_origin\fR +List of origin hosts that are allowed for CORS requests in addition to what +the container has set. Use a comma separated list of full URL (http://foo.bar:1234,https://foo.bar) +.IP \fBstrict_cors_mode\fR +If True (default) then CORS requests are only allowed if their Origin header +matches an allowed origin. Otherwise, any Origin is allowed. +.IP \fBcors_expose_headers\fR +Comma separated list of headers to expose through Access-Control-Expose-Headers, +in addition to the defaults and any headers set in container metadata. +.IP \fBnice_priority\fR +Modify scheduling priority of server processes. Niceness values range from -20 +(most favorable to the process) to 19 (least favorable to the process). +The default does not modify priority. +.IP \fBionice_class\fR +Modify I/O scheduling class of server processes. I/O niceness class values +are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and IOPRIO_CLASS_IDLE (idle). +The default does not modify class and priority. +Work only with ionice_priority. +.IP \fBionice_priority\fR +Modify I/O scheduling priority of server processes. I/O niceness priority +is a number which goes from 0 to 7. 
The higher the value, the lower +the I/O priority of the process. Work only with ionice_class. +Ignored if IOPRIO_CLASS_IDLE is set. .RE .PD @@ -91,8 +173,13 @@ are acceptable within this section. .IP "\fBpipeline\fR" It is used when you need apply a number of filters. It is a list of filters -ended by an application. The normal pipeline is "catch_errors healthcheck -cache ratelimit tempauth proxy-logging proxy-server". +ended by an application. The normal pipeline is "catch_errors gatekeeper healthcheck proxy-logging cache container_sync bulk tempurl ratelimit tempauth container-quotas account-quotas slo dlo versioned_writes proxy-logging proxy-server". + +Note: The double proxy-logging in the pipeline is not a mistake. The +left-most proxy-logging is there to log requests that were handled in +middleware and never made it through to the right-most middleware (and +proxy server). Double logging is prevented for normal requests. See +proxy-logging docs. .RE .PD @@ -114,6 +201,7 @@ This is normally \fBegg:swift#healthcheck\fR. An optional filesystem path which, if present, will cause the healthcheck URL to return "503 Service Unavailable" with a body of "DISABLED BY FILE". .RE +.PD .RS 0 @@ -141,20 +229,35 @@ systems are in use for one Swift cluster. The default is AUTH. .IP \fBauth_prefix\fR The auth prefix will cause requests beginning with this prefix to be routed to the auth subsystem, for granting tokens, etc. The default is /auth/. +.IP \fBrequire_group\fR +The require_group parameter names a group that must be presented by +either X-Auth-Token or X-Service-Token. Usually this parameter is +used only with multiple reseller prefixes (e.g., SERVICE_require_group=blah). +By default, no group is needed. Do not use .admin. .IP \fBtoken_life\fR This is the time in seconds before the token expires. The default is 86400. -.IP \fBallowed_sync_hosts\fR -This is a comma separated list of hosts allowed to send X-Container-Sync-Key requests. +.IP \fBallow_overrides\fR +This allows middleware higher in the WSGI pipeline to override auth +processing, useful for middleware such as tempurl and formpost. If you know +you're not going to use such middleware and you want a bit of extra security, +you can set this to false. The default is true. +.IP \fBstorage_url_scheme\fR +This specifies what scheme to return with storage urls: +http, https, or default (chooses based on what the server is running as) +This can be useful with an SSL load balancer in front of a non-SSL server. .IP \fBuser__\fR Lastly, you need to list all the accounts/users you want here. The format is: user__ = [group] [group] [...] [storage_url] +or if you want underscores in or , you can base64 encode them +(with no equal signs) and use this format: +user64__ = [group] [group] [...] [storage_url] There are special groups of: \fI.reseller_admin\fR who can do anything to any account for this auth and also \fI.admin\fR who can do anything within the account. If neither of these groups are specified, the user can only access containers that have been explicitly allowed for them by a \fI.admin\fR or \fI.reseller_admin\fR. -The trailing optional storage_url allows you to specify an alternate url to hand +The trailing optional storage_url allows you to specify an alternate URL to hand back to the user upon authentication. 
If not specified, this defaults to \fIhttp[s]://:/v1/_\fR where http or https depends on whether cert_file is specified in the [DEFAULT] section, and are based @@ -173,6 +276,113 @@ Here are example entries, required for running the tests: .RE .PD +.RS 0 +.IP "\fB[filter:authtoken]\fR" +.RE + +To enable Keystone authentication you need to have the auth token +middleware first to be configured. Here is an example below, please +refer to the keystone's documentation for details about the +different settings. + +You'll need to have as well the keystoneauth middleware enabled +and have it in your main pipeline so instead of having tempauth in +there you can change it to: authtoken keystoneauth + +The auth credentials ("project_domain_name", "user_domain_name", "username", +"project_name", "password") must match the Keystone credentials for the Swift +service. The example values shown here assume a user named "swift" with admin +role on a project named "service", both being in the Keystone domain with id +"default". Refer to the KeystoneMiddleware documentation at +.BI https://docs.openstack.org/keystonemiddleware/latest/middlewarearchitecture.html#configuration +for other examples. + +.PD 0 +.RS 10 +.IP "paste.filter_factory = keystonemiddleware.auth_token:filter_factory" +.IP "www_authenticate_uri = http://keystonehost:5000" +.IP "auth_url = http://keystonehost:5000" +.IP "auth_plugin = password" +.IP "project_domain_id = default" +.IP "user_domain_id = default" +.IP "project_name = service" +.IP "username = swift" +.IP "password = password" +.IP "" +.IP "# delay_auth_decision defaults to False, but leaving it as false will" +.IP "# prevent other auth systems, staticweb, tempurl, formpost, and ACLs from" +.IP "# working. This value must be explicitly set to True." +.IP "delay_auth_decision = False" +.IP +.IP "cache = swift.cache" +.IP "include_service_catalog = False" +.RE +.PD + + +.RS 0 +.IP "\fB[filter:keystoneauth]\fR" +.RE + +Keystone authentication middleware. + +.RS 3 +.IP \fBuse\fR +Entry point for paste.deploy for the keystoneauth middleware. This is the reference to the installed python egg. +This is normally \fBegg:swift#keystoneauth\fR. +.IP \fBreseller_prefix\fR +The reseller_prefix option lists account namespaces that this middleware is +responsible for. The prefix is placed before the Keystone project id. +For example, for project 12345678, and prefix AUTH, the account is +named AUTH_12345678 (i.e., path is /v1/AUTH_12345678/...). +Several prefixes are allowed by specifying a comma-separated list +as in: "reseller_prefix = AUTH, SERVICE". The empty string indicates a +single blank/empty prefix. If an empty prefix is required in a list of +prefixes, a value of '' (two single quote characters) indicates a +blank/empty prefix. Except for the blank/empty prefix, an underscore ('_') +character is appended to the value unless already present. +.IP \fBoperator_roles\fR +The user must have at least one role named by operator_roles on a +project in order to create, delete and modify containers and objects +and to set and read privileged headers such as ACLs. +If there are several reseller prefix items, you can prefix the +parameter so it applies only to those accounts (for example +the parameter SERVICE_operator_roles applies to the /v1/SERVICE_ +path). If you omit the prefix, the option applies to all reseller +prefix items. For the blank/empty prefix, prefix with '' (do not put +underscore after the two single quote characters). 
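To make the prefix handling above concrete, here is a minimal keystoneauth sketch; the role names and the per-prefix SERVICE_ override are illustrative, not required:

    [filter:keystoneauth]
    use = egg:swift#keystoneauth
    # projects appear as AUTH_<project_id> and SERVICE_<project_id> accounts
    reseller_prefix = AUTH, SERVICE
    operator_roles = admin, swiftoperator
    # roles that apply only to the SERVICE_ reseller prefix (example role name)
    SERVICE_operator_roles = service_operator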
+.IP \fBreseller_admin_role\fR +The reseller admin role has the ability to create and delete accounts. +.IP \fBallow_overrides\fR +This allows middleware higher in the WSGI pipeline to override auth +processing, useful for middleware such as tempurl and formpost. If you know +you're not going to use such middleware and you want a bit of extra security, +you can set this to false. +.IP \fBservice_roles\fR +If the service_roles parameter is present, an X-Service-Token must be +present in the request that when validated, grants at least one role listed +in the parameter. The X-Service-Token may be scoped to any project. +If there are several reseller prefix items, you can prefix the +parameter so it applies only to those accounts (for example +the parameter SERVICE_service_roles applies to the /v1/SERVICE_ +path). If you omit the prefix, the option applies to all reseller +prefix items. For the blank/empty prefix, prefix with '' (do not put +underscore after the two single quote characters). +By default, no service_roles are required. +.IP \fBdefault_domain_id\fR +For backwards compatibility, keystoneauth will match names in cross-tenant +access control lists (ACLs) when both the requesting user and the tenant +are in the default domain i.e the domain to which existing tenants are +migrated. The default_domain_id value configured here should be the same as +the value used during migration of tenants to keystone domains. +.IP \fBallow_names_in_acls\fR +For a new installation, or an installation in which keystone projects may +move between domains, you should disable backwards compatible name matching +in ACLs by setting allow_names_in_acls to false: +.RE +.PD + + .RS 0 .IP "\fB[filter:cache]\fR" .RE @@ -191,27 +401,18 @@ Syslog log facility. The default is LOG_LOCAL0. Logging level. The default is INFO. .IP "\fBset log_address\fR" Logging address. The default is /dev/log. -.IP "\fBset log_headers\fR " +.IP "\fBset log_headers\fR" Enables the ability to log request headers. The default is False. +.IP \fBmemcache_max_connections\fR +Sets the maximum number of connections to each memcached server per worker. .IP \fBmemcache_servers\fR -If not set in the configuration file, the value for memcache_servers will be read from /etc/swift/memcache.conf (see memcache.conf-sample) or lacking that file, it will default to the value below. You can specify multiple servers separated with commas, as in: 10.1.2.3:11211,10.1.2.4:11211. This can be a list separated by commas. The default is 127.0.0.1:11211. -.IP \fBmemcache_serialization_support\fR -This sets how memcache values are serialized and deserialized: -.RE - -.PD 0 -.RS 10 -.IP "0 = older, insecure pickle serialization" -.IP "1 = json serialization but pickles can still be read (still insecure)" -.IP "2 = json serialization only (secure and the default)" +If not set in the configuration file, the value for memcache_servers will be +read from /etc/swift/memcache.conf (see memcache.conf-sample) or lacking that +file, it will default to 127.0.0.1:11211. You can specify multiple servers +separated with commas, as in: 10.1.2.3:11211,10.1.2.4:11211. (IPv6 +addresses must follow rfc3986 section-3.2.2, i.e. [::1]:11211) .RE - -.RS 10 -To avoid an instant full cache flush, existing installations should upgrade with 0, then set to 1 and reload, then after some time (24 hours) set to 2 and reload. In the future, the ability to use pickle serialization will be removed. 
- -If not set in the configuration file, the value for memcache_serialization_support will be read from /etc/swift/memcache.conf if it exists (see memcache.conf-sample). Otherwise, the default value as indicated above will be used. -.RE - +.PD .RS 0 @@ -251,22 +452,23 @@ rate but better average accuracy. The default is 5. .IP \fBaccount_ratelimit\fR If set, will limit PUT and DELETE requests to /account_name/container_name. Number is in requests per second. If set to 0 means disabled. The default is 0. -.IP \fBaccount_whitelist\fR -Comma separated lists of account names that will not be rate limited. The default is ''. -.IP \fBaccount_blacklist\fR -Comma separated lists of account names that will not be allowed. Returns a 497 response. -The default is ''. .IP \fBcontainer_ratelimit_size\fR When set with container_limit_x = r: for containers of size x, limit requests per second to r. Will limit PUT, DELETE, and POST requests to /a/c/o. The default is ''. +.IP \fBcontainer_listing_ratelimit_size\fR +Similarly to the above container-level write limits, the following will limit +container GET (listing) requests. .RE +.PD + .RS 0 .IP "\fB[filter:domain_remap]\fR" .RE -Middleware that translates container and account parts of a domain to path parameters that the proxy server understands. The container.account.storageurl/object gets translated to container.account.storageurl/path_root/account/container/object and account.storageurl/path_root/container/object gets translated to account.storageurl/path_root/account/container/object +Middleware that translates container and account parts of a domain to path parameters that the proxy server understands. +The container.account.storageurl/object gets translated to container.account.storageurl/path_root/account/container/object and account.storageurl/path_root/container/object gets translated to account.storageurl/path_root/account/container/object .RS 3 .IP \fBuse\fR @@ -274,12 +476,16 @@ Entry point for paste.deploy for the domain_remap middleware. This is the refere This is normally \fBegg:swift#domain_remap\fR. .IP "\fBset log_name\fR" Label used when logging. The default is domain_remap. +.IP "\fBset log_facility\fR" +Syslog log facility. The default is LOG_LOCAL0. +.IP "\fBset log_level\fR " +Logging level. The default is INFO. .IP "\fBset log_address\fR" Logging address. The default is /dev/log. -.IP "\fBset log_headers\fR" +.IP "\fBset log_headers\fR " Enables the ability to log request headers. The default is False. .IP \fBstorage_domain\fR -The domain to be used by the middleware. +The domain to be used by the middleware. Multiple domains can be specified separated by a comma. .IP \fBpath_root\fR The path root value for the storage URL. The default is v1. .IP \fBreseller_prefixes\fR @@ -287,11 +493,15 @@ Browsers can convert a host header to lowercase, so check that reseller prefix on the account is the correct case. This is done by comparing the items in the reseller_prefixes config option to the found prefix. If they match except for case, the item from reseller_prefixes will be used -instead of the found reseller prefix. The reseller_prefixes list is exclusive. -If defined, any request with an account prefix not in that list will be ignored -by this middleware. Defaults to 'AUTH'. +instead of the found reseller prefix. When none match, the default reseller +prefix is used. When no default reseller prefix is configured, any request with +an account prefix not in that list will be ignored by this middleware. +Defaults to 'AUTH'. 
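A short domain_remap sketch using the options above; the storage domain is a placeholder for your own, and the comment simply restates the translation described earlier:

    [filter:domain_remap]
    use = egg:swift#domain_remap
    storage_domain = example.com
    path_root = v1
    reseller_prefixes = AUTH
    # requests for <container>.<account>.example.com/<object> are remapped to
    # /v1/<account>/<container>/<object> before reaching the proxy server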
+.IP \fBdefault_reseller_prefix\fR +The default reseller prefix. This is used when none of the configured +reseller_prefixes match. When not set, no reseller prefix is added. .RE - +.PD .RS 0 @@ -312,7 +522,7 @@ Logging address. The default is /dev/log. .IP "\fBset log_headers\fR" Enables the ability to log request headers. The default is False. .RE - +.PD .RS 0 @@ -340,8 +550,12 @@ The domain to be used by the middleware. .IP \fBlookup_depth\fR How deep in the CNAME chain to look for something that matches the storage domain. The default is 1. +.IP \fBnameservers\fR +Specify the nameservers to use to do the CNAME resolution. If unset, the system +configuration is used. Multiple nameservers can be specified separated by a comma. +Default is unset. .RE - +.PD .RS 0 @@ -354,8 +568,6 @@ Note: Put staticweb just after your auth filter(s) in the pipeline .IP \fBuse\fR Entry point for paste.deploy for the staticweb middleware. This is the reference to the installed python egg. This is normally \fBegg:swift#staticweb\fR. -.IP \fBcache_timeout\fR -Seconds to cache container x-container-meta-web-* header values. The default is 300 seconds. .IP "\fBset log_name\fR" Label used when logging. The default is staticweb. .IP "\fBset log_facility\fR" @@ -366,23 +578,22 @@ Logging level. The default is INFO. Logging address. The default is /dev/log. .IP "\fBset log_headers\fR" Enables the ability to log request headers. The default is False. -.IP "\fBset access_log_name\fR" -Label used when logging. The default is staticweb. -.IP "\fBset access_log_facility\fR" -Syslog log facility. The default is LOG_LOCAL0. -.IP "\fBset access_log_level\fR " -Logging level. The default is INFO. .RE - +.PD .RS 0 .IP "\fB[filter:tempurl]\fR" .RE -Note: Put tempurl just before your auth filter(s) in the pipeline +Note: Put tempurl before slo, dlo, and your auth filter(s) in the pipeline .RS 3 +.IP \fBuse\fR +Entry point for paste.deploy for the tempurl middleware. This is the reference to the installed python egg. +This is normally \fBegg:swift#tempurl\fR. +.IP \fBmethods\fR +The methods allowed with Temp URLs. The default is 'GET HEAD PUT POST DELETE'. .IP \fBincoming_remove_headers\fR The headers to remove from incoming requests. Simply a whitespace delimited list of header names and names can optionally end with '*' to indicate a prefix match. incoming_allow_headers is a list of exceptions to these removals. .IP \fBincoming_allow_headers\fR @@ -391,9 +602,8 @@ The headers allowed as exceptions to incoming_remove_headers. Simply a whitespac The headers to remove from outgoing responses. Simply a whitespace delimited list of header names and names can optionally end with '*' to indicate a prefix match. outgoing_allow_headers is a list of exceptions to these removals. .IP "\fBoutgoing_allow_headers\fR" The headers allowed as exceptions to outgoing_remove_headers. Simply a whitespace delimited list of header names and names can optionally end with '*' to indicate a prefix match. -.IP "\fBset log_level\fR " .RE - +.PD .RS 0 @@ -407,6 +617,7 @@ Note: Put formpost just before your auth filter(s) in the pipeline Entry point for paste.deploy for the formpost middleware. This is the reference to the installed python egg. This is normally \fBegg:swift#formpost\fR. .RE +.PD @@ -421,16 +632,29 @@ Note: Just needs to be placed before the proxy-server in the pipeline. Entry point for paste.deploy for the name_check middleware. This is the reference to the installed python egg. This is normally \fBegg:swift#name_check\fR. 
.IP \fBforbidden_chars\fR -Characters that will not be allowed in a name. +Characters that will not be allowed in a name. The default is '"`<>. .IP \fBmaximum_length\fR -Maximum number of characters that can be in the name. +Maximum number of characters that can be in the name. The default is 255. .IP \fBforbidden_regexp\fR -Python regular expressions of substrings that will not be allowed in a name. +Python regular expressions of substrings that will not be allowed in a name. The default is /\./|/\.\./|/\.$|/\.\.$. +.RE +.PD + + +.RS 0 +.IP "\fB[filter:list-endpoints]\fR" +.RS 3 +.IP \fBuse\fR +Entry point for paste.deploy for the list_endpoints middleware. This is the reference to the installed python egg. +This is normally \fBegg:swift#list_endpoints\fR. +.IP \fBlist_endpoints_path\fR +The default is '/endpoints/'. .RE +.PD .RS 0 -.IP "\fB[filter:proxy_logging]\fR" +.IP "\fB[filter:proxy-logging]\fR" .RE Logging for the proxy server now lives in this middleware. @@ -456,25 +680,304 @@ unset. Default is 514. .IP \fBaccess_log_statsd_host\fR You can use log_statsd_* from [DEFAULT], or override them here. -Default is localhost. +StatsD server. IPv4/IPv6 addresses and hostnames are +supported. If a hostname resolves to an IPv4 and IPv6 address, the IPv4 +address will be used. .IP \fBaccess_log_statsd_port\fR Default is 8125. .IP \fBaccess_log_statsd_default_sample_rate\fR Default is 1. -.IP \fBaccess_log_statsd_metric_prefix = +.IP \fBaccess_log_statsd_sample_rate_factor\fR +The default is 1. +.IP \fBaccess_log_statsd_metric_prefix\fR Default is "" (empty-string) .IP \fBaccess_log_headers\fR Default is False. +.IP \fBaccess_log_headers_only\fR +If access_log_headers is True and access_log_headers_only is set only +these headers are logged. Multiple headers can be defined as comma separated +list like this: access_log_headers_only = Host, X-Object-Meta-Mtime +.IP \fBreveal_sensitive_prefix\fR +By default, the X-Auth-Token is logged. To obscure the value, +set reveal_sensitive_prefix to the number of characters to log. +For example, if set to 12, only the first 12 characters of the +token appear in the log. An unauthorized access of the log file +won't allow unauthorized usage of the token. However, the first +12 or so characters is unique enough that you can trace/debug +token usage. Set to 0 to suppress the token completely (replaced +by '...' in the log). The default is 16 chars. +Note: reveal_sensitive_prefix will not affect the value logged with access_log_headers=True. .IP \fBlog_statsd_valid_http_methods\fR What HTTP methods are allowed for StatsD logging (comma-sep); request methods not in this list will have "BAD_METHOD" for the portion of the metric. Default is "GET,HEAD,POST,PUT,DELETE,COPY,OPTIONS". +.IP \fBlog_anonymization_method\fR +Hashing algorithm for anonymization. Must be one of algorithms supported by Python's hashlib. Default is MD5. +.IP \fBlog_anonymization_salt\fR +Salt added as prefix before hashing the value to anonymize. Default is empty (no salt). +.IP "\fBlog_msg_template\fR" +Template used to format access logs. All words surrounded by curly brackets will be substituted with the appropriate values. + .RE +.PD 0 +.RS 10 +.IP "Some keywords map to timestamps and can be converted to standard dates formats using the matching transformers: 'datetime', 'asctime' or 'iso8601'." +.IP "Other transformers for timestamps are 's', 'ms', 'us' and 'ns' for seconds, milliseconds, microseconds and nanoseconds." 
+.IP "Python's strftime directives can also be used as tranformers (a, A, b, B, c, d, H, I, j, m, M, p, S, U, w, W, x, X, y, Y, Z)." +.IP "Some keywords map to user data that could be anonymized by using the transformer 'anonymized'." +.IP "Keywords availables are:" +.PD 0 +.RS 7 +.IP "client_ip (anonymizable)" +.IP "remote_addr (anonymizable)" +.IP "method (request method)" +.IP "path (anonymizable)" +.IP "protocol" +.IP "status_int" +.IP "referer (anonymizable)" +.IP "user_agent (anonymizable)" +.IP "auth_token" +.IP "bytes_recvd (number of bytes received)" +.IP "bytes_sent (number of bytes sent)" +.IP "client_etag (anonymizable)" +.IP "transaction_id" +.IP "headers (anonymizable)" +.IP "request_time (difference between start and end timestamps) +.IP "source" +.IP "log_info" +.IP "start_time (timestamp at the receiving, timestamp)" +.IP "end_time (timestamp at the end of the treatment, timestamp)" +.IP "ttfb (duration between request and first bytes is sent)" +.IP "policy_index" +.IP "account (account name, anonymizable)" +.IP "container (container name, anonymizable)" +.IP "object (object name, anonymizable)" +.IP "pid (PID of the process emitting the log line)" +.PD +.RE + +.IP "Example: '{client_ip.anonymized} {remote_addr.anonymized} {start_time.iso8601} {end_time.H}:{end_time.M} {method} acc:{account} cnt:{container} obj:{object.anonymized}'" +.IP "Default: '{client_ip} {remote_addr} {end_time.datetime} {method} {path} {protocol} {status_int} {referer} {user_agent} {auth_token} {bytes_recvd} {bytes_sent} {client_etag} {transaction_id} {headers} {request_time} {source} {log_info} {start_time} {end_time} {policy_index}'" +.IP "Warning: A bad log message template will raise an error in initialization." +.RE +.PD +.RS 0 +.IP "\fB[filter:bulk]\fR" +.RE + +Note: Put before both ratelimit and auth in the pipeline. + +.RS 3 +.IP \fBuse\fR +Entry point for paste.deploy for the bulk middleware. This is the reference to the installed python egg. +This is normally \fBegg:swift#bulk\fR. +.IP \fBmax_containers_per_extraction\fR +The default is 10000. +.IP \fBmax_failed_extractions\fR +The default is 1000. +.IP \fBmax_deletes_per_request\fR +The default is 10000. +.IP \fBmax_failed_deletes\fR +The default is 1000. + +In order to keep a connection active during a potentially long bulk request, +Swift may return whitespace prepended to the actual response body. This +whitespace will be yielded no more than every yield_frequency seconds. +The default is 10. +.IP \fByield_frequency\fR + +.IP \fBdelete_container_retry_count\fR +Note: This parameter is used during a bulk delete of objects and +their container. This would frequently fail because it is very likely +that all replicated objects have not been deleted by the time the middleware got a +successful response. It can be configured the number of retries. And the +number of seconds to wait between each retry will be 1.5**retry +The default is 0. +.RE .PD +.RS 0 +.IP "\fB[filter:slo]\fR" +.RE + +Note: Put after auth and staticweb in the pipeline. + +.RS 3 +.IP \fBuse\fR +Entry point for paste.deploy for the slo middleware. This is the reference to the installed python egg. +This is normally \fBegg:swift#slo\fR. +.IP \fBmax_manifest_segments\fR +The default is 1000. +.IP \fBmax_manifest_size\fR +The default is 2097152. +.IP \fBmin_segment_size\fR +The default is 1048576 +.IP \fBrate_limit_after_segment\fR +Start rate-limiting object segments after the Nth segment of a segmented +object. The default is 10 segments. 
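For reference, a minimal slo filter section spelling out the defaults documented in this section (values shown only to make the knobs concrete):

    [filter:slo]
    use = egg:swift#slo
    max_manifest_segments = 1000
    max_manifest_size = 2097152
    min_segment_size = 1048576
    rate_limit_after_segment = 10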
+.IP \fBrate_limit_segments_per_sec\fR +Once segment rate-limiting kicks in for an object, limit segments served to N +per second. The default is 1. +.IP \fBmax_get_time\fR +Time limit on GET requests (seconds). The default is 86400. +.RE +.PD + + +.RS 0 +.IP "\fB[filter:dlo]\fR" +.RE + +Note: Put after auth and staticweb in the pipeline. +If you don't put it in the pipeline, it will be inserted for you. + +.RS 3 +.IP \fBuse\fR +Entry point for paste.deploy for the dlo middleware. This is the reference to the installed python egg. +This is normally \fBegg:swift#dlo\fR. +.IP \fBrate_limit_after_segment\fR +Start rate-limiting object segments after the Nth segment of a segmented +object. The default is 10 segments. +.IP \fBrate_limit_segments_per_sec\fR +Once segment rate-limiting kicks in for an object, limit segments served to N +per second. The default is 1. +.IP \fBmax_get_time\fR +Time limit on GET requests (seconds). The default is 86400. +.RE +.PD + + +.RS 0 +.IP "\fB[filter:container-quotas]\fR" +.RE + +Note: Put after auth in the pipeline. + +.RS 3 +.IP \fBuse\fR +Entry point for paste.deploy for the container_quotas middleware. This is the reference to the installed python egg. +This is normally \fBegg:swift#container_quotas\fR. +.RE +.PD + + +.RS 0 +.IP "\fB[filter:account-quotas]\fR" +.RE + +Note: Put after auth in the pipeline. + +.RS 3 +.IP \fBuse\fR +Entry point for paste.deploy for the account_quotas middleware. This is the reference to the installed python egg. +This is normally \fBegg:swift#account_quotas\fR. +.RE +.PD + + +.RS 0 +.IP "\fB[filter:gatekeeper]\fR" +.RE + +Note: this middleware requires python-dnspython + +.RS 3 +.IP \fBuse\fR +Entry point for paste.deploy for the gatekeeper middleware. This is the reference to the installed python egg. +This is normally \fBegg:swift#gatekeeper\fR. +.IP "\fBset log_name\fR" +Label used when logging. The default is gatekeeper. +.IP "\fBset log_facility\fR" +Syslog log facility. The default is LOG_LOCAL0. +.IP "\fBset log_level\fR " +Logging level. The default is INFO. +.IP "\fBset log_address\fR" +Logging address. The default is /dev/log. +.IP "\fBset log_headers\fR" +Enables the ability to log request headers. The default is False. +.RE +.PD + + +.RS 0 +.IP "\fB[filter:container_sync]\fR" +.RE + +Note: this middleware requires python-dnspython + +.RS 3 +.IP \fBuse\fR +Entry point for paste.deploy for the container_sync middleware. This is the reference to the installed python egg. +This is normally \fBegg:swift#container_sync\fR. +.IP \fBallow_full_urls\fR +Set this to false if you want to disallow any full URL values to be set for +any new X-Container-Sync-To headers. This will keep any new full urls from +coming in, but won't change any existing values already in the cluster. +Updating those will have to be done manually, as knowing what the true realm +endpoint should be cannot always be guessed. The default is true. +.IP \fBcurrent\fR +Set this to specify this clusters //realm/cluster as "current" in /info +.RE +.PD + + +.RS 0 +.IP "\fB[filter:xprofile]\fR" +.RE + +Note: Put it at the beginning of the pipeline to profile all middleware. But it is safer to put this after healthcheck. + +.RS 3 +.IP "\fBuse\fR" +Entry point for paste.deploy for the xprofile middleware. This is the reference to the installed python egg. +This is normally \fBegg:swift#xprofile\fR. +.IP "\fBprofile_module\fR" +This option enable you to switch profilers which should inherit from python +standard profiler. 
Currently the supported value can be 'cProfile', 'eventlet.green.profile' etc. +.IP "\fBlog_filename_prefix\fR" +This prefix will be used to combine process ID and timestamp to name the +profile data file. Make sure the executing user has permission to write +into this path (missing path segments will be created, if necessary). +If you enable profiling in more than one type of daemon, you must override +it with an unique value like, the default is /var/log/swift/profile/account.profile. +.IP "\fBdump_interval\fR" +The profile data will be dumped to local disk based on above naming rule +in this interval. The default is 5.0. +.IP "\fBdump_timestamp\fR" +Be careful, this option will enable profiler to dump data into the file with +time stamp which means there will be lots of files piled up in the directory. +The default is false +.IP "\fBpath\fR" +This is the path of the URL to access the mini web UI. The default is __profile__. +.IP "\fBflush_at_shutdown\fR" +Clear the data when the wsgi server shutdown. The default is false. +.IP "\fBunwind\fR" +Unwind the iterator of applications. Default is false. +.RE +.PD + + +.RS 0 +.IP "\fB[filter:versioned_writes]\fR" +.RE + +Note: Put after slo, dlo in the pipeline. +If you don't put it in the pipeline, it will be inserted automatically. + +.RS 3 +.IP \fBuse\fR +Entry point for paste.deploy for the versioned_writes middleware. This is the reference to the installed python egg. +This is normally \fBegg:swift#versioned_writes\fR. +.IP \fBallow_versioned_writes\fR +Enables using versioned writes middleware and exposing configuration settings via HTTP GET /info. +WARNING: Setting this option bypasses the "allow_versions" option +in the container configuration file, which will be eventually +deprecated. See documentation for more details. +.RE +.PD .SH APP SECTION @@ -485,13 +988,13 @@ that are acceptable within this section. .IP \fBuse\fR Entry point for paste.deploy for the proxy server. This is the reference to the installed python egg. This is normally \fBegg:swift#proxy\fR. -.IP \fBset log_name\fR +.IP "\fBset log_name\fR" Label used when logging. The default is proxy-server. -.IP \fBset log_facility\fR +.IP "\fBset log_facility\fR" Syslog log facility. The default is LOG_LOCAL0. -.IP \fB set log_level\fR +.IP "\fBset log_level\fR" Logging level. The default is INFO. -.IP \fB set log_address\fR +.IP "\fBset log_address\fR" Logging address. The default is /dev/log. .IP \fBlog_handoffs\fR Log when handoff locations are used. Default is True. @@ -500,15 +1003,24 @@ Cache timeout in seconds to send memcached for account existence. The default is .IP \fBrecheck_container_existence\fR Cache timeout in seconds to send memcached for container existence. The default is 60 seconds. .IP \fBobject_chunk_size\fR -Chunk size to read from object servers. The default is 8192. +Chunk size to read from object servers. The default is 65536. .IP \fBclient_chunk_size\fR -Chunk size to read from clients. The default is 8192. +Chunk size to read from clients. The default is 65536. .IP \fBnode_timeout\fR Request timeout to external services. The default is 10 seconds. -.IP \fBclient_timeoutt\fR -Timeout to read one chunk from a client. The default is 60 seconds. +.IP \fBrecoverable_node_timeout\fR +How long the proxy server will wait for an initial response and to read a +chunk of data from the object servers while serving GET / HEAD requests. 
+Timeouts from these requests can be recovered from so setting this to +something lower than node_timeout would provide quicker error recovery +while allowing for a longer timeout for non-recoverable requests (PUTs). +Defaults to node_timeout, should be overridden if node_timeout is set to a +high number to prevent client timeouts from firing before the proxy server +has a chance to retry. .IP \fBconn_timeout\fR Connection timeout to external services. The default is 0.5 seconds. +.IP \fBpost_quorum_timeout\fR +How long to wait for requests to finish after a quorum has been established. The default is 0.5 seconds. .IP \fBerror_suppression_interval\fR Time in seconds that must elapse since the last error for a node to be considered no longer error limited. The default is 60 seconds. @@ -518,35 +1030,115 @@ Error count to consider a node error limited. The default is 10. Whether account PUTs and DELETEs are even callable. If set to 'true' any authorized user may create and delete accounts; if 'false' no one, even authorized, can. The default is false. -.IP \fBobject_post_as_copy\fR -Set object_post_as_copy = false to turn on fast posts where only the metadata changes -are stored as new and the original data file is kept in place. This makes for quicker -posts; but since the container metadata isn't updated in this mode, features like -container sync won't be able to sync posts. The default is True. .IP \fBaccount_autocreate\fR If set to 'true' authorized accounts that do not yet exist within the Swift cluster will be automatically created. The default is set to false. +.IP \fBmax_containers_per_account\fR +If set to a positive value, trying to create a container when the account +already has at least this maximum containers will result in a 403 Forbidden. +Note: This is a soft limit, meaning a user might exceed the cap for +recheck_account_existence before the 403s kick in. +.IP \fBmax_containers_whitelist\fR +This is a comma separated list of account hashes that ignore the max_containers_per_account cap. +.IP \fBdeny_host_headers\fR +Comma separated list of Host headers to which the proxy will deny requests. The default is empty. +.IP \fBsorting_method\fR +Storage nodes can be chosen at random (shuffle - default), by using timing +measurements (timing), or by using an explicit match (affinity). +Using timing measurements may allow for lower overall latency, while +using affinity allows for finer control. In both the timing and +affinity cases, equally-sorting nodes are still randomly chosen to +spread load. +The valid values for sorting_method are "affinity", "shuffle", and "timing". +.IP \fBtiming_expiry\fR +If the "timing" sorting_method is used, the timings will only be valid for +the number of seconds configured by timing_expiry. The default is 300. +.IP \fBconcurrent_gets\fR +If "on" then use replica count number of threads concurrently during a GET/HEAD +and return with the first successful response. In the EC case, this parameter +only affects an EC HEAD as an EC GET behaves differently. Default is "off". +.IP \fBconcurrency_timeout\fR +This parameter controls how long to wait before firing off the next +concurrent_get thread. A value of 0 would we fully concurrent, any other number +will stagger the firing of the threads. This number should be between 0 and +node_timeout. The default is the value of conn_timeout (0.5). +.IP \fBrequest_node_count\fR +Set to the number of nodes to contact for a normal request. 
You can use '* replicas' +at the end to have it use the number given times the number of +replicas for the ring being used for the request. The default is '2 * replicas'. +.IP \fBread_affinity\fR +Specifies which backend servers to prefer on reads. Format is a comma +separated list of affinity descriptors of the form <selection>=<priority>. +The <selection> may be r<N> for selecting nodes in region N or r<N>z<M> for +selecting nodes in region N, zone M. The <priority> value should be a whole +number that represents the priority to be given to the selection; lower numbers +are higher priority. Default is empty, meaning no preference. + +Example: first read from region 1 zone 1, then region 1 zone 2, then anything +in region 2, then everything else: + +.PD 0 +.RS 10 +.IP "read_affinity = r1z1=100, r1z2=200, r2=300" +.RE +.PD +.IP \fBwrite_affinity\fR +Specifies which backend servers to prefer on writes. Format is a comma +separated list of affinity descriptors of the form r<N> for region N or +r<N>z<M> for region N, zone M. If this is set, then when handling an object +PUT request, some number (see setting write_affinity_node_count) of local +backend servers will be tried before any nonlocal ones. Default is empty, +meaning no preference. + +Example: try to write to regions 1 and 2 before writing to any other +nodes: + +.PD 0 +.RS 10 +write_affinity = r1, r2 +.RE +.PD +.IP \fBwrite_affinity_node_count\fR +The number of local (as governed by the write_affinity setting) nodes to +attempt to contact first on writes, before any non-local ones. The value +should be an integer number, or use '* replicas' at the end to have it use +the number given times the number of replicas for the ring being used for the +request. The default is '2 * replicas'. +.IP \fBswift_owner_headers\fR +These are the headers whose values will only be shown to swift_owners. The +exact definition of a swift_owner is up to the auth system in use, but +usually indicates administrative responsibilities. +The default is 'x-container-read, x-container-write, x-container-sync-key, x-container-sync-to, x-account-meta-temp-url-key, x-account-meta-temp-url-key-2, x-container-meta-temp-url-key, x-container-meta-temp-url-key-2, x-account-access-control'. .IP \fBrate_limit_after_segment\fR Start rate-limiting object segments after the Nth segment of a segmented object. The default is 10 segments. .IP \fBrate_limit_segments_per_sec\fR Once segment rate-limiting kicks in for an object, limit segments served to N per second. The default is 1. +.IP \fBnice_priority\fR +Modify scheduling priority of server processes. Niceness values range from -20 +(most favorable to the process) to 19 (least favorable to the process). +The default does not modify priority. +.IP \fBionice_class\fR +Modify I/O scheduling class of server processes. I/O niceness class values +are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and IOPRIO_CLASS_IDLE (idle). +The default does not modify class and priority. +Works only with ionice_priority. +.IP \fBionice_priority\fR +Modify I/O scheduling priority of server processes. I/O niceness priority +is a number which goes from 0 to 7. The higher the value, the lower +the I/O priority of the process. Works only with ionice_class. +Ignored if IOPRIO_CLASS_IDLE is set.
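Putting the sorting and affinity options together, a sketch of a two-region setup (region numbers and priorities are illustrative); read_affinity is only consulted when sorting_method is set to affinity:

    [app:proxy-server]
    use = egg:swift#proxy
    sorting_method = affinity
    # prefer region 1 for reads, then region 2, then everything else
    read_affinity = r1=100, r2=200
    # try region 1 nodes first on writes
    write_affinity = r1
    write_affinity_node_count = 2 * replicas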
.RE .PD - - .SH DOCUMENTATION .LP More in depth documentation about the swift-proxy-server and -also Openstack-Swift as a whole can be found at -.BI http://swift.openstack.org/admin_guide.html +also OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/admin_guide.html and -.BI http://swift.openstack.org - +.BI https://docs.openstack.org/swift/latest/ .SH "SEE ALSO" -.BR swift-proxy-server(1), - - +.BR swift-proxy-server(1) diff --git a/doc/manpages/swift-account-audit.1 b/doc/manpages/swift-account-audit.1 new file mode 100644 index 0000000000..64d60c584b --- /dev/null +++ b/doc/manpages/swift-account-audit.1 @@ -0,0 +1,63 @@ +.\" +.\" Copyright (c) 2016 OpenStack Foundation. +.\" +.\" Licensed under the Apache License, Version 2.0 (the "License"); +.\" you may not use this file except in compliance with the License. +.\" You may obtain a copy of the License at +.\" +.\" http://www.apache.org/licenses/LICENSE-2.0 +.\" +.\" Unless required by applicable law or agreed to in writing, software +.\" distributed under the License is distributed on an "AS IS" BASIS, +.\" WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +.\" implied. +.\" See the License for the specific language governing permissions and +.\" limitations under the License. +.\" +.TH SWIFT-ACCOUNT-AUDIT "1" "August 2016" "OpenStack Swift" +.SH NAME +swift\-account\-audit \- manually audit OpenStack Swift accounts + +.SH SYNOPSIS +.PP +.B swift\-account\-audit\/ +\fI[options]\fR \fI[url 1]\fR \fI[url 2]\fR \fI...\fR + +.SH DESCRIPTION +.PP +The swift-account-audit cli tool can be used to audit the data for an account. +It crawls the account, checking that all containers and objects can be found. + +You can also feed a list of URLs to the script through stdin. + +.SH OPTIONS +.TP +\fB\-c\fR \fIconcurrency\fR +Set the concurrency, default 50 +.TP +\fB\-r\fR \fIring dir\fR +Ring locations, default \fI/etc/swift\fR +.TP +\fB\-e\fR \fIfilename\fR +File for writing a list of inconsistent URLs +.TP +\fB\-d\fR +Also download files and verify md5 + +.SH EXAMPLES +.nf +/usr/bin/swift\-account\-audit\/ AUTH_88ad0b83\-b2c5\-4fa1\-b2d6\-60c597202076 +/usr/bin/swift\-account\-audit\/ AUTH_88ad0b83\-b2c5\-4fa1\-b2d6\-60c597202076/container/object +/usr/bin/swift\-account\-audit\/ \fB\-e\fR errors.txt AUTH_88ad0b83\-b2c5\-4fa1\-b2d6\-60c597202076/container +/usr/bin/swift\-account\-audit\/ < errors.txt +/usr/bin/swift\-account\-audit\/ \fB\-c\fR 25 \fB\-d\fR < errors.txt +.fi + +.SH DOCUMENTATION +.LP +More in depth documentation in regards to +.BI swift\-account\-audit +and also about OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/ +and +.BI https://docs.openstack.org diff --git a/doc/manpages/swift-account-auditor.1 b/doc/manpages/swift-account-auditor.1 index 86e60fbb4c..9983ac61de 100644 --- a/doc/manpages/swift-account-auditor.1 +++ b/doc/manpages/swift-account-auditor.1 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2010-2012 OpenStack, LLC. +.\" Copyright (c) 2010-2012 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. @@ -14,24 +14,24 @@ .\" implied. .\" See the License for the specific language governing permissions and .\" limitations under the License. 
-.\" +.\" .TH swift-account-auditor 1 "8/26/2011" "Linux" "OpenStack Swift" -.SH NAME +.SH NAME .LP -.B swift-account-auditor -\- Openstack-swift account auditor +.B swift-account-auditor +\- OpenStack Swift account auditor .SH SYNOPSIS .LP -.B swift-account-auditor +.B swift-account-auditor [CONFIG] [-h|--help] [-v|--verbose] [-o|--once] -.SH DESCRIPTION +.SH DESCRIPTION .PP -The account auditor crawls the local account system checking the integrity of accounts -objects. If corruption is found (in the case of bit rot, for example), the file is +The account auditor crawls the local account system checking the integrity of accounts +objects. If corruption is found (in the case of bit rot, for example), the file is quarantined, and replication will replace the bad file from another replica. The options are as follows: @@ -46,17 +46,17 @@ The options are as follows: .IP "-o" .IP "--once" .RS 4 -.IP "only run one pass of daemon" +.IP "only run one pass of daemon" .RE .PD .RE - + .SH DOCUMENTATION .LP -More in depth documentation in regards to -.BI swift-account-auditor -and also about Openstack-Swift as a whole can be found at -.BI http://swift.openstack.org/index.html +More in depth documentation in regards to +.BI swift-account-auditor +and also about OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/ .SH "SEE ALSO" .BR account-server.conf(5) diff --git a/doc/manpages/swift-account-info.1 b/doc/manpages/swift-account-info.1 new file mode 100644 index 0000000000..41ab188214 --- /dev/null +++ b/doc/manpages/swift-account-info.1 @@ -0,0 +1,69 @@ +.\" +.\" Author: Madhuri Kumari +.\" +.\" Licensed under the Apache License, Version 2.0 (the "License"); +.\" you may not use this file except in compliance with the License. +.\" You may obtain a copy of the License at +.\" +.\" http://www.apache.org/licenses/LICENSE-2.0 +.\" +.\" Unless required by applicable law or agreed to in writing, software +.\" distributed under the License is distributed on an "AS IS" BASIS, +.\" WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +.\" implied. +.\" See the License for the specific language governing permissions and +.\" limitations under the License. +.\" +.TH swift-account-info 1 "10/25/2016" "Linux" "OpenStack Swift" + +.SH NAME +.LP +.B swift-account-info +\- OpenStack Swift account-info tool + +.SH SYNOPSIS +.LP +.B swift-account-info + [options] + +.SH DESCRIPTION +.PP +This is a very simple swift tool that allows a swiftop engineer to retrieve +information about an account that is located on the storage node. One calls +the tool with a given db file as it is stored on the storage node system. 
+It will then return several information about that account such as; + +.PD 0 +.IP "- Account" +.IP "- Account hash " +.IP "- Created timestamp " +.IP "- Put timestamp " +.IP "- Delete timestamp " +.IP "- Container Count " +.IP "- Object count " +.IP "- Bytes used " +.IP "- Chexor " +.IP "- ID" +.IP "- User Metadata " +.IP "- Ring Location" +.PD + +.SH OPTIONS +.TP +\fB\-h, --help \fR +Shows the help message and exit +.TP +\fB\-d SWIFT_DIR, --swift-dir=SWIFT_DIR\fR +Pass location of swift configuration file if different from the default +location /etc/swift + +.SH DOCUMENTATION +.LP +More documentation about OpenStack Swift can be found at +.BI https://docs.openstack.org/swift/latest/ + +.SH "SEE ALSO" + +.BR swift-container-info(1), +.BR swift-get-nodes(1), +.BR swift-object-info(1) diff --git a/doc/manpages/swift-account-reaper.1 b/doc/manpages/swift-account-reaper.1 index 4dc1f72929..225aee34a3 100644 --- a/doc/manpages/swift-account-reaper.1 +++ b/doc/manpages/swift-account-reaper.1 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2010-2012 OpenStack, LLC. +.\" Copyright (c) 2010-2012 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. @@ -14,24 +14,24 @@ .\" implied. .\" See the License for the specific language governing permissions and .\" limitations under the License. -.\" +.\" .TH swift-account-reaper 1 "8/26/2011" "Linux" "OpenStack Swift" -.SH NAME +.SH NAME .LP .B swift-account-reaper -\- Openstack-swift account reaper +\- OpenStack Swift account reaper .SH SYNOPSIS .LP -.B swift-account-reaper +.B swift-account-reaper [CONFIG] [-h|--help] [-v|--verbose] [-o|--once] -.SH DESCRIPTION +.SH DESCRIPTION .PP Removes data from status=DELETED accounts. These are accounts that have been asked to be removed by the reseller via services remove_storage_account -XMLRPC call. +XMLRPC call. .PP The account is not deleted immediately by the services call, but instead the account is simply marked for deletion by setting the status column in @@ -51,18 +51,18 @@ The options are as follows: .IP "-o" .IP "--once" .RS 4 -.IP "only run one pass of daemon" +.IP "only run one pass of daemon" .RE .PD .RE - + .SH DOCUMENTATION .LP -More in depth documentation in regards to -.BI swift-object-auditor -and also about Openstack-Swift as a whole can be found at -.BI http://swift.openstack.org/index.html +More in depth documentation in regards to +.BI swift-object-auditor +and also about OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/ .SH "SEE ALSO" diff --git a/doc/manpages/swift-account-replicator.1 b/doc/manpages/swift-account-replicator.1 index 7df81ed8ff..896f2eb307 100644 --- a/doc/manpages/swift-account-replicator.1 +++ b/doc/manpages/swift-account-replicator.1 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2010-2012 OpenStack, LLC. +.\" Copyright (c) 2010-2012 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. @@ -14,31 +14,31 @@ .\" implied. .\" See the License for the specific language governing permissions and .\" limitations under the License. 
-.\" +.\" .TH swift-account-replicator 1 "8/26/2011" "Linux" "OpenStack Swift" -.SH NAME +.SH NAME .LP -.B swift-account-replicator -\- Openstack-swift account replicator +.B swift-account-replicator +\- OpenStack Swift account replicator .SH SYNOPSIS .LP -.B swift-account-replicator +.B swift-account-replicator [CONFIG] [-h|--help] [-v|--verbose] [-o|--once] -.SH DESCRIPTION +.SH DESCRIPTION .PP -Replication is designed to keep the system in a consistent state in the face of -temporary error conditions like network outages or drive failures. The replication -processes compare local data with each remote copy to ensure they all contain the -latest version. Account replication uses a combination of hashes and shared high +Replication is designed to keep the system in a consistent state in the face of +temporary error conditions like network outages or drive failures. The replication +processes compare local data with each remote copy to ensure they all contain the +latest version. Account replication uses a combination of hashes and shared high water marks to quickly compare subsections of each partition. .PP -Replication updates are push based. Account replication push missing records over +Replication updates are push based. Account replication push missing records over HTTP or rsync whole database files. The replicator also ensures that data is removed -from the system. When an account item is deleted a tombstone is set as the latest -version of the item. The replicator will see the tombstone and ensure that the item +from the system. When an account item is deleted a tombstone is set as the latest +version of the item. The replicator will see the tombstone and ensure that the item is removed from the entire system. The options are as follows: @@ -53,18 +53,18 @@ The options are as follows: .IP "-o" .IP "--once" .RS 4 -.IP "only run one pass of daemon" +.IP "only run one pass of daemon" .RE -.PD +.PD .RE - - + + .SH DOCUMENTATION .LP -More in depth documentation in regards to +More in depth documentation in regards to .BI swift-account-replicator -and also about Openstack-Swift as a whole can be found at -.BI http://swift.openstack.org/index.html +and also about OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/ .SH "SEE ALSO" diff --git a/doc/manpages/swift-account-server.1 b/doc/manpages/swift-account-server.1 index 21ba86f7a9..1d4b2992e1 100644 --- a/doc/manpages/swift-account-server.1 +++ b/doc/manpages/swift-account-server.1 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2010-2011 OpenStack, LLC. +.\" Copyright (c) 2010-2011 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. @@ -14,33 +14,33 @@ .\" implied. .\" See the License for the specific language governing permissions and .\" limitations under the License. -.\" +.\" .TH swift-account-server 1 "8/26/2011" "Linux" "OpenStack Swift" -.SH NAME +.SH NAME .LP .B swift-account-server -\- Openstack-swift account server +\- OpenStack Swift account server .SH SYNOPSIS .LP .B swift-account-server [CONFIG] [-h|--help] [-v|--verbose] -.SH DESCRIPTION +.SH DESCRIPTION .PP The Account Server's primary job is to handle listings of containers. The listings are stored as sqlite database files, and replicated across the cluster similar to how -objects are. +objects are. 
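A typical invocation, assuming the conventional configuration path (adjust to your deployment):

    swift-account-server /etc/swift/account-server.conf
    swift-account-server /etc/swift/account-server.conf -v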
.SH DOCUMENTATION .LP -More in depth documentation in regards to +More in depth documentation in regards to .BI swift-account-server -and also about Openstack-Swift as a whole can be found at -.BI http://swift.openstack.org/index.html -and -.BI http://docs.openstack.org +and also about OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/ +and +.BI https://docs.openstack.org .SH "SEE ALSO" diff --git a/doc/manpages/swift-config.1 b/doc/manpages/swift-config.1 new file mode 100644 index 0000000000..d1ad1af8c6 --- /dev/null +++ b/doc/manpages/swift-config.1 @@ -0,0 +1,51 @@ +.\" +.\" Copyright (c) 2016 OpenStack Foundation. +.\" +.\" Licensed under the Apache License, Version 2.0 (the "License"); +.\" you may not use this file except in compliance with the License. +.\" You may obtain a copy of the License at +.\" +.\" http://www.apache.org/licenses/LICENSE-2.0 +.\" +.\" Unless required by applicable law or agreed to in writing, software +.\" distributed under the License is distributed on an "AS IS" BASIS, +.\" WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +.\" implied. +.\" See the License for the specific language governing permissions and +.\" limitations under the License. +.\" +.TH SWIFT-CONFIG "1" "August 2016" "OpenStack Swift" + +.SH NAME +swift\-config \- OpenStack Swift config parser + +.SH SYNOPSIS +.B swift\-config +[\fIoptions\fR] \fISERVER\fR + +.SH DESCRIPTION +.PP +Combine Swift configuration files and print result. + +.SH OPTIONS +.TP +\fB\-h\fR, \fB\-\-help\fR +Show this help message and exit +.TP +\fB\-c\fR \fIN\fR, \fB\-\-config\-num\fR=\fIN\fR +Parse config for the \fIN\fRth server only +.TP +\fB\-s\fR \fISECTION\fR, \fB\-\-section\fR=\fISECTION\fR +Only display matching sections +.TP +\fB\-w\fR, \fB\-\-wsgi\fR +Use wsgi/paste parser instead of readconf + +.SH DOCUMENTATION +.LP +More in depth documentation in regards to +.BI swift\-config +and also about OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/ +and +.BI https://docs.openstack.org diff --git a/doc/manpages/swift-container-auditor.1 b/doc/manpages/swift-container-auditor.1 index 2718f043d5..eae68fc006 100644 --- a/doc/manpages/swift-container-auditor.1 +++ b/doc/manpages/swift-container-auditor.1 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2010-2012 OpenStack, LLC. +.\" Copyright (c) 2010-2012 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. @@ -14,24 +14,24 @@ .\" implied. .\" See the License for the specific language governing permissions and .\" limitations under the License. -.\" +.\" .TH swift-container-auditor 1 "8/26/2011" "Linux" "OpenStack Swift" -.SH NAME +.SH NAME .LP -.B swift-container-auditor -\- Openstack-swift container auditor +.B swift-container-auditor +\- OpenStack Swift container auditor .SH SYNOPSIS .LP -.B swift-container-auditor +.B swift-container-auditor [CONFIG] [-h|--help] [-v|--verbose] [-o|--once] -.SH DESCRIPTION +.SH DESCRIPTION .PP -The container auditor crawls the local container system checking the integrity of container -objects. If corruption is found (in the case of bit rot, for example), the file is +The container auditor crawls the local container system checking the integrity of container +objects. 
If corruption is found (in the case of bit rot, for example), the file is quarantined, and replication will replace the bad file from another replica. The options are as follows: @@ -46,18 +46,18 @@ The options are as follows: .IP "-o" .IP "--once" .RS 4 -.IP "only run one pass of daemon" +.IP "only run one pass of daemon" .RE .PD .RE - - + + .SH DOCUMENTATION .LP -More in depth documentation in regards to -.BI swift-container-auditor -and also about Openstack-Swift as a whole can be found at -.BI http://swift.openstack.org/index.html +More in depth documentation in regards to +.BI swift-container-auditor +and also about OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/ .SH "SEE ALSO" diff --git a/doc/manpages/swift-container-info.1 b/doc/manpages/swift-container-info.1 new file mode 100644 index 0000000000..ddacd7cf17 --- /dev/null +++ b/doc/manpages/swift-container-info.1 @@ -0,0 +1,74 @@ +.\" +.\" Author: Madhuri Kumari +.\" Copyright (c) 2010-2011 OpenStack Foundation. +.\" +.\" Licensed under the Apache License, Version 2.0 (the "License"); +.\" you may not use this file except in compliance with the License. +.\" You may obtain a copy of the License at +.\" +.\" http://www.apache.org/licenses/LICENSE-2.0 +.\" +.\" Unless required by applicable law or agreed to in writing, software +.\" distributed under the License is distributed on an "AS IS" BASIS, +.\" WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +.\" implied. +.\" See the License for the specific language governing permissions and +.\" limitations under the License. +.\" +.TH swift-container-info 1 "10/25/2016" "Linux" "OpenStack Swift" + +.SH NAME +.LP +.B swift-container-info +\- OpenStack Swift container-info tool + +.SH SYNOPSIS +.LP +.B swift-container-info + [options] + +.SH DESCRIPTION +.PP +This is a very simple swift tool that allows a swiftop engineer to retrieve +information about a container that is located on the storage node. +One calls the tool with a given container db file as +it is stored on the storage node system. +It will then return several information about that container such as; + +.PD 0 +.IP "- Account it belongs to" +.IP "- Container " +.IP "- Created timestamp " +.IP "- Put timestamp " +.IP "- Delete timestamp " +.IP "- Object count " +.IP "- Bytes used " +.IP "- Reported put timestamp " +.IP "- Reported delete timestamp " +.IP "- Reported object count " +.IP "- Reported bytes used " +.IP "- Hash " +.IP "- ID " +.IP "- User metadata " +.IP "- X-Container-Sync-Point 1 " +.IP "- X-Container-Sync-Point 2 " +.IP "- Location on the ring " +.PD + +.SH OPTIONS +.TP +\fB\-h, --help \fR +Shows the help message and exit +.TP +\fB\-d SWIFT_DIR, --swift-dir=SWIFT_DIR\fR +Pass location of swift configuration file if different from the default +location /etc/swift + +.SH DOCUMENTATION +.LP +More documentation about OpenStack Swift can be found at +.BI https://docs.openstack.org/swift/latest/ + +.SH "SEE ALSO" +.BR swift-get-nodes(1), +.BR swift-object-info(1) diff --git a/doc/manpages/swift-container-reconciler.1 b/doc/manpages/swift-container-reconciler.1 new file mode 100644 index 0000000000..eaee41bbfb --- /dev/null +++ b/doc/manpages/swift-container-reconciler.1 @@ -0,0 +1,58 @@ +.\" +.\" Copyright (c) 2016 OpenStack Foundation. +.\" +.\" Licensed under the Apache License, Version 2.0 (the "License"); +.\" you may not use this file except in compliance with the License. 
+.\" You may obtain a copy of the License at +.\" +.\" http://www.apache.org/licenses/LICENSE-2.0 +.\" +.\" Unless required by applicable law or agreed to in writing, software +.\" distributed under the License is distributed on an "AS IS" BASIS, +.\" WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +.\" implied. +.\" See the License for the specific language governing permissions and +.\" limitations under the License. +.\" +.TH SWIFT-CONTAINER-RECONCILER "1" "August 2016" "OpenStack Swift" + +.SH NAME +swift\-container\-reconciler \- OpenStack Swift container reconciler + +.SH SYNOPSIS +.B swift\-container\-reconciler +\fICONFIG \fR[\fIoptions\fR] + +.SH DESCRIPTION +.PP +This daemon will take objects that are in the wrong storage policy and +move them to the right ones, or delete requests that went to the wrong +storage policy and apply them to the right ones. It operates on a +queue similar to the object-expirer's queue. + +Discovering that the object is in the wrong policy is done in the container +replicator; the container reconciler is the daemon that handles them once they +happen. + +Like the object expirer, you only need to run one of these per cluster + +.SH OPTIONS +.TP +\fB\-h\fR, \fB\-\-help\fR +Show this help message and exit +.TP +\fB\-v\fR, \fB\-\-verbose\fR +Log to console +.TP +\fB\-o\fR, \fB\-\-once\fR +Only run one pass of daemon +.PP + +.SH DOCUMENTATION +.LP +More in depth documentation in regards to +.BI swift\-container\-reconciler +and also about OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/ +and +.BI https://docs.openstack.org diff --git a/doc/manpages/swift-container-replicator.1 b/doc/manpages/swift-container-replicator.1 index 0469c78ff2..b0103f1633 100644 --- a/doc/manpages/swift-container-replicator.1 +++ b/doc/manpages/swift-container-replicator.1 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2010-2012 OpenStack, LLC. +.\" Copyright (c) 2010-2012 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. @@ -14,31 +14,31 @@ .\" implied. .\" See the License for the specific language governing permissions and .\" limitations under the License. -.\" +.\" .TH swift-container-replicator 1 "8/26/2011" "Linux" "OpenStack Swift" -.SH NAME +.SH NAME .LP -.B swift-container-replicator -\- Openstack-swift container replicator +.B swift-container-replicator +\- OpenStack Swift container replicator .SH SYNOPSIS .LP -.B swift-container-replicator +.B swift-container-replicator [CONFIG] [-h|--help] [-v|--verbose] [-o|--once] -.SH DESCRIPTION +.SH DESCRIPTION .PP -Replication is designed to keep the system in a consistent state in the face of -temporary error conditions like network outages or drive failures. The replication -processes compare local data with each remote copy to ensure they all contain the -latest version. Container replication uses a combination of hashes and shared high +Replication is designed to keep the system in a consistent state in the face of +temporary error conditions like network outages or drive failures. The replication +processes compare local data with each remote copy to ensure they all contain the +latest version. Container replication uses a combination of hashes and shared high water marks to quickly compare subsections of each partition. .PP -Replication updates are push based. 
Container replication push missing records over +Replication updates are push based. Container replication push missing records over HTTP or rsync whole database files. The replicator also ensures that data is removed -from the system. When an container item is deleted a tombstone is set as the latest -version of the item. The replicator will see the tombstone and ensure that the item +from the system. When an container item is deleted a tombstone is set as the latest +version of the item. The replicator will see the tombstone and ensure that the item is removed from the entire system. The options are as follows: @@ -53,18 +53,18 @@ The options are as follows: .IP "-o" .IP "--once" .RS 4 -.IP "only run one pass of daemon" +.IP "only run one pass of daemon" .RE .PD .RE - - + + .SH DOCUMENTATION .LP -More in depth documentation in regards to +More in depth documentation in regards to .BI swift-container-replicator -and also about Openstack-Swift as a whole can be found at -.BI http://swift.openstack.org/index.html +and also about OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/ .SH "SEE ALSO" diff --git a/doc/manpages/swift-container-server.1 b/doc/manpages/swift-container-server.1 index 20cc5aebe4..0271bdac69 100644 --- a/doc/manpages/swift-container-server.1 +++ b/doc/manpages/swift-container-server.1 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2010-2011 OpenStack, LLC. +.\" Copyright (c) 2010-2011 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. @@ -14,37 +14,37 @@ .\" implied. .\" See the License for the specific language governing permissions and .\" limitations under the License. -.\" +.\" .TH swift-container-server 1 "8/26/2011" "Linux" "OpenStack Swift" -.SH NAME +.SH NAME .LP .B swift-container-server -\- Openstack-swift container server +\- OpenStack Swift container server .SH SYNOPSIS .LP .B swift-container-server [CONFIG] [-h|--help] [-v|--verbose] -.SH DESCRIPTION +.SH DESCRIPTION .PP -The Container Server's primary job is to handle listings of objects. It doesn't know -where those objects are, just what objects are in a specific container. The listings -are stored as sqlite database files, and replicated across the cluster similar to how -objects are. Statistics are also tracked that include the total number of objects, and +The Container Server's primary job is to handle listings of objects. It doesn't know +where those objects are, just what objects are in a specific container. The listings +are stored as sqlite database files, and replicated across the cluster similar to how +objects are. Statistics are also tracked that include the total number of objects, and total storage usage for that container. 
.SH DOCUMENTATION .LP -More in depth documentation in regards to +More in depth documentation in regards to .BI swift-container-server -and also about Openstack-Swift as a whole can be found at -.BI http://swift.openstack.org/index.html -and -.BI http://docs.openstack.org +and also about OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/ +and +.BI https://docs.openstack.org -.LP +.LP .SH "SEE ALSO" .BR container-server.conf(5) diff --git a/doc/manpages/swift-container-sync.1 b/doc/manpages/swift-container-sync.1 index 11669ec1b3..1c1616faa5 100644 --- a/doc/manpages/swift-container-sync.1 +++ b/doc/manpages/swift-container-sync.1 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2010-2011 OpenStack, LLC. +.\" Copyright (c) 2010-2011 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. @@ -14,25 +14,25 @@ .\" implied. .\" See the License for the specific language governing permissions and .\" limitations under the License. -.\" +.\" .TH swift-container-sync 1 "8/26/2011" "Linux" "OpenStack Swift" -.SH NAME +.SH NAME .LP .B swift-container-sync -\- Openstack-swift container sync +\- OpenStack Swift container sync .SH SYNOPSIS .LP .B swift-container-sync [CONFIG] [-h|--help] [-v|--verbose] [-o|--once] -.SH DESCRIPTION +.SH DESCRIPTION .PP Swift has a feature where all the contents of a container can be mirrored to another container through background synchronization. Swift cluster operators configure their cluster to allow/accept sync requests to/from other clusters, -and the user specifies where to sync their container to along with a secret +and the user specifies where to sync their container to along with a secret synchronization key. .PP The swift-container-sync does the job of sending updates to the remote container. @@ -42,14 +42,14 @@ newer rows since the last sync will trigger PUTs or DELETEs to the other contain .SH DOCUMENTATION .LP -More in depth documentation in regards to +More in depth documentation in regards to .BI swift-container-sync -and also about Openstack-Swift as a whole can be found at -.BI http://swift.openstack.org/overview_container_sync.html -and -.BI http://docs.openstack.org +and also about OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/overview_container_sync.html +and +.BI https://docs.openstack.org -.LP +.LP .SH "SEE ALSO" .BR container-server.conf(5) diff --git a/doc/manpages/swift-container-updater.1 b/doc/manpages/swift-container-updater.1 index 9ec709ce70..c69b533629 100644 --- a/doc/manpages/swift-container-updater.1 +++ b/doc/manpages/swift-container-updater.1 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2010-2012 OpenStack, LLC. +.\" Copyright (c) 2010-2012 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. @@ -14,31 +14,31 @@ .\" implied. .\" See the License for the specific language governing permissions and .\" limitations under the License. 
-.\" +.\" .TH swift-container-updater 1 "8/26/2011" "Linux" "OpenStack Swift" -.SH NAME +.SH NAME .LP .B swift-container-updater -\- Openstack-swift container updater +\- OpenStack Swift container updater .SH SYNOPSIS .LP -.B swift-container-updater +.B swift-container-updater [CONFIG] [-h|--help] [-v|--verbose] [-o|--once] -.SH DESCRIPTION +.SH DESCRIPTION .PP -The container updater is responsible for updating container information in the account database. +The container updater is responsible for updating container information in the account database. It will walk the container path in the system looking for container DBs and sending updates -to the account server as needed as it goes along. +to the account server as needed as it goes along. -There are times when account data can not be immediately updated. This usually occurs -during failure scenarios or periods of high load. This is where an eventual consistency -window will most likely come in to play. +There are times when account data can not be immediately updated. This usually occurs +during failure scenarios or periods of high load. This is where an eventual consistency +window will most likely come in to play. -In practice, the consistency window is only as large as the frequency at which -the updater runs and may not even be noticed as the proxy server will route +In practice, the consistency window is only as large as the frequency at which +the updater runs and may not even be noticed as the proxy server will route listing requests to the first account server which responds. The server under load may not be the one that serves subsequent listing requests – one of the other two replicas may handle the listing. @@ -55,17 +55,17 @@ The options are as follows: .IP "-o" .IP "--once" .RS 4 -.IP "only run one pass of daemon" +.IP "only run one pass of daemon" .RE .PD .RE - + .SH DOCUMENTATION .LP -More in depth documentation in regards to +More in depth documentation in regards to .BI swift-container-updater -and also about Openstack-Swift as a whole can be found at -.BI http://swift.openstack.org/index.html +and also about OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/ .SH "SEE ALSO" diff --git a/doc/manpages/swift-dispersion-populate.1 b/doc/manpages/swift-dispersion-populate.1 index 27188cef1b..6584bfb211 100644 --- a/doc/manpages/swift-dispersion-populate.1 +++ b/doc/manpages/swift-dispersion-populate.1 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2010-2011 OpenStack, LLC. +.\" Copyright (c) 2010-2011 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. @@ -14,26 +14,26 @@ .\" implied. .\" See the License for the specific language governing permissions and .\" limitations under the License. -.\" +.\" .TH swift-dispersion-populate 1 "8/26/2011" "Linux" "OpenStack Swift" -.SH NAME +.SH NAME .LP .B swift-dispersion-populate -\- Openstack-swift dispersion populate +\- OpenStack Swift dispersion populate .SH SYNOPSIS .LP -.B swift-dispersion-populate +.B swift-dispersion-populate [--container-suffix-start] [--object-suffix-start] [--container-only|--object-only] [--insecure] [conf_file] -.SH DESCRIPTION +.SH DESCRIPTION .PP This is one of the swift-dispersion utilities that is used to evaluate the -overall cluster health. This is accomplished by checking if a set of +overall cluster health. 
This is accomplished by checking if a set of deliberately distributed containers and objects are currently in their proper places within the cluster. -.PP +.PP For instance, a common deployment has three replicas of each object. The health of that object can be measured by checking if each replica is in its proper place. If only 2 of the 3 is in place the object's health @@ -48,17 +48,36 @@ we need to run the \fBswift-dispersion-report\fR tool to check the health of eac of these containers and objects. .PP -These tools need direct access to the entire cluster and to the ring files. -Installing them on a proxy server will probably do or a box used for swift -administration purposes that also contains the common swift packages and ring. -Both \fBswift-dispersion-populate\fR and \fBswift-dispersion-report\fR use the +These tools need direct access to the entire cluster and to the ring files. +Installing them on a proxy server will probably do or a box used for swift +administration purposes that also contains the common swift packages and ring. +Both \fBswift-dispersion-populate\fR and \fBswift-dispersion-report\fR use the same configuration file, /etc/swift/dispersion.conf . The account used by these tool should be a dedicated account for the dispersion stats and also have admin -privileges. +privileges. + +.SH OPTIONS +.RS 0 +.PD 1 +.IP "\fB--insecure\fR" +Allow accessing insecure keystone server. The keystone's certificate will not +be verified. +.IP "\fB--container-suffix-start=NUMBER\fR" +Start container suffix at NUMBER and resume population at this point; default: 0 +.IP "\fB--object-suffix-start=NUMBER\fR" +Start object suffix at NUMBER and resume population at this point; default: 0 +.IP "\fB--object-only\fR" +Only run object population +.IP "\fB--container-only\fR" +Only run container population +.IP "\fB--no-overlap\fR" +Increase coverage by amount in dispersion_coverage option with no overlap of existing partitions (if run more than once) +.IP "\fB-P, --policy-name\fR" +Specify storage policy name .SH CONFIGURATION -.PD 0 -Example \fI/etc/swift/dispersion.conf\fR: +.PD 0 +Example \fI/etc/swift/dispersion.conf\fR: .RS 3 .IP "[dispersion]" @@ -66,30 +85,37 @@ Example \fI/etc/swift/dispersion.conf\fR: .IP "auth_user = dpstats:dpstats" .IP "auth_key = dpstats" .IP "swift_dir = /etc/swift" -.IP "# dispersion_coverage = 1" +.IP "# project_name = dpstats" +.IP "# project_domain_name = default" +.IP "# user_domain_name = default" +.IP "# dispersion_coverage = 1.0" .IP "# retries = 5" .IP "# concurrency = 25" +.IP "# endpoint_type = publicURL" .RE -.PD - .SH EXAMPLE -.PP +.PD + +.SH EXAMPLE +.PP .PD 0 $ swift-dispersion-populate .RS 1 .IP "Created 2621 containers for dispersion reporting, 38s, 0 retries" .IP "Created 2621 objects for dispersion reporting, 27s, 0 retries" -.RE +.RE + .PD - + + .SH DOCUMENTATION .LP More in depth documentation about the swift-dispersion utilities and -also Openstack-Swift as a whole can be found at -.BI http://swift.openstack.org/admin_guide.html#cluster-health -and -.BI http://swift.openstack.org +also OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/admin_guide.html#dispersion-report +and +.BI https://docs.openstack.org/swift/latest/ .SH "SEE ALSO" .BR swift-dispersion-report(1), -.BR dispersion.conf (5) +.BR dispersion.conf(5) diff --git a/doc/manpages/swift-dispersion-report.1 b/doc/manpages/swift-dispersion-report.1 index 2b0ffcd796..f789720616 100644 --- a/doc/manpages/swift-dispersion-report.1 +++ 
b/doc/manpages/swift-dispersion-report.1 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2010-2011 OpenStack, LLC. +.\" Copyright (c) 2010-2011 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. @@ -14,45 +14,45 @@ .\" implied. .\" See the License for the specific language governing permissions and .\" limitations under the License. -.\" +.\" .TH swift-dispersion-report 1 "8/26/2011" "Linux" "OpenStack Swift" -.SH NAME +.SH NAME .LP .B swift-dispersion-report -\- Openstack-swift dispersion report +\- OpenStack Swift dispersion report .SH SYNOPSIS .LP -.B swift-dispersion-report [-d|--debug] [-j|--dump-json] [-p|--partitions] [--container-only|--object-only] [conf_file] +.B swift-dispersion-report [-d|--debug] [-j|--dump-json] [-p|--partitions] [--container-only|--object-only] [--insecure] [conf_file] -.SH DESCRIPTION +.SH DESCRIPTION .PP This is one of the swift-dispersion utilities that is used to evaluate the -overall cluster health. This is accomplished by checking if a set of +overall cluster health. This is accomplished by checking if a set of deliberately distributed containers and objects are currently in their proper places within the cluster. -.PP +.PP For instance, a common deployment has three replicas of each object. The health of that object can be measured by checking if each replica is in its proper place. If only 2 of the 3 is in place the object's health can be said to be at 66.66%, where 100% would be perfect. .PP -Once the \fBswift-dispersion-populate\fR has been used to populate the -dispersion account, one should run the \fBswift-dispersion-report\fR tool +Once the \fBswift-dispersion-populate\fR has been used to populate the +dispersion account, one should run the \fBswift-dispersion-report\fR tool repeatedly for the life of the cluster, in order to check the health of each of these containers and objects. .PP -These tools need direct access to the entire cluster and to the ring files. -Installing them on a proxy server will probably do or a box used for swift -administration purposes that also contains the common swift packages and ring. -Both \fBswift-dispersion-populate\fR and \fBswift-dispersion-report\fR use the +These tools need direct access to the entire cluster and to the ring files. +Installing them on a proxy server will probably do or a box used for swift +administration purposes that also contains the common swift packages and ring. +Both \fBswift-dispersion-populate\fR and \fBswift-dispersion-report\fR use the same configuration file, /etc/swift/dispersion.conf . The account used by these tool should be a dedicated account for the dispersion stats and also have admin -privileges. +privileges. .SH OPTIONS .RS 0 @@ -60,33 +60,28 @@ privileges. .IP "\fB-d, --debug\fR" output any 404 responses to standard error -.SH OPTIONS -.RS 0 -.PD 1 .IP "\fB-j, --dump-json\fR" output dispersion report in json format -.SH OPTIONS -.RS 0 -.PD 1 .IP "\fB-p, --partitions\fR" output the partition numbers that have any missing replicas -.SH OPTIONS -.RS 0 -.PD 1 .IP "\fB--container-only\fR" Only run the container report -.SH OPTIONS -.RS 0 -.PD 1 .IP "\fB--object-only\fR" Only run the object report +.IP "\fB--insecure\fR" +Allow accessing insecure keystone server. The keystone's certificate will not +be verified. 
+ +.IP "\fB-P, --policy-name\fR" +Specify storage policy name + .SH CONFIGURATION -.PD 0 -Example \fI/etc/swift/dispersion.conf\fR: +.PD 0 +Example \fI/etc/swift/dispersion.conf\fR: .RS 3 .IP "[dispersion]" @@ -94,17 +89,23 @@ Example \fI/etc/swift/dispersion.conf\fR: .IP "auth_user = dpstats:dpstats" .IP "auth_key = dpstats" .IP "swift_dir = /etc/swift" -.IP "# dispersion_coverage = 1" +.IP "# project_name = dpstats" +.IP "# project_domain_name = default" +.IP "# user_domain_name = default" +.IP "# dispersion_coverage = 1.0" .IP "# retries = 5" .IP "# concurrency = 25" .IP "# dump_json = no" +.IP "# endpoint_type = publicURL" .RE -.PD - .SH EXAMPLE -.PP +.PD + +.SH EXAMPLE +.PP .PD 0 -$ swift-dispersion-report - +$ swift-dispersion-report + + .RS 1 .IP "Queried 2622 containers for dispersion reporting, 31s, 0 retries" .IP "100.00% of container copies found (7866 of 7866)" @@ -113,18 +114,20 @@ $ swift-dispersion-report .IP "Queried 2621 objects for dispersion reporting, 22s, 0 retries" .IP "100.00% of object copies found (7863 of 7863)" .IP "Sample represents 1.00% of the object partition space" -.RE +.RE + .PD - + + .SH DOCUMENTATION .LP More in depth documentation about the swift-dispersion utilities and -also Openstack-Swift as a whole can be found at -.BI http://swift.openstack.org/admin_guide.html#cluster-health -and -.BI http://swift.openstack.org +also OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/admin_guide.html#dispersion-report +and +.BI https://docs.openstack.org/swift/latest/ .SH "SEE ALSO" .BR swift-dispersion-populate(1), -.BR dispersion.conf (5) +.BR dispersion.conf(5) diff --git a/doc/manpages/swift-drive-audit.1 b/doc/manpages/swift-drive-audit.1 new file mode 100644 index 0000000000..cf8902061b --- /dev/null +++ b/doc/manpages/swift-drive-audit.1 @@ -0,0 +1,38 @@ +.\" +.\" Copyright (c) 2016 OpenStack Foundation. +.\" +.\" Licensed under the Apache License, Version 2.0 (the "License"); +.\" you may not use this file except in compliance with the License. +.\" You may obtain a copy of the License at +.\" +.\" http://www.apache.org/licenses/LICENSE-2.0 +.\" +.\" Unless required by applicable law or agreed to in writing, software +.\" distributed under the License is distributed on an "AS IS" BASIS, +.\" WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +.\" implied. +.\" See the License for the specific language governing permissions and +.\" limitations under the License. +.\" +.TH SWIFT-DRIVE-AUDIT "1" "August 2016" "OpenStack Swift" + +.SH NAME +swift\-drive\-audit \- OpenStack Swift drive audit cron job + +.SH SYNOPSIS +.B swift\-drive\-audit +\fICONFIG\fR + +.SH DESCRIPTION +.PP +Tool that can be run by using cron to watch for bad drives. If errors are +detected, it unmounts the bad drive, so that Swift can work around it. + +.SH DOCUMENTATION +.LP +More in depth documentation in regards to +.BI swift\-drive\-audit +and also about OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/ +and +.BI https://docs.openstack.org diff --git a/doc/manpages/swift-form-signature.1 b/doc/manpages/swift-form-signature.1 new file mode 100644 index 0000000000..2ce640b90c --- /dev/null +++ b/doc/manpages/swift-form-signature.1 @@ -0,0 +1,67 @@ +.\" +.\" Copyright (c) 2016 OpenStack Foundation. +.\" +.\" Licensed under the Apache License, Version 2.0 (the "License"); +.\" you may not use this file except in compliance with the License. 
+.\" You may obtain a copy of the License at +.\" +.\" http://www.apache.org/licenses/LICENSE-2.0 +.\" +.\" Unless required by applicable law or agreed to in writing, software +.\" distributed under the License is distributed on an "AS IS" BASIS, +.\" WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +.\" implied. +.\" See the License for the specific language governing permissions and +.\" limitations under the License. +.\" +.TH SWIFT-FORM-SIGNATURE "1" "August 2016" "OpenStack Swift" + +.SH NAME +swift\-form\-signature \- compute the expires and signature for OpenStack Swift Form POST middleware + +.SH SYNOPSIS +.B swift\-form\-signature +\fIpath\fR \fIredirect\fR \fImax_file_size\fR \fImax_file_count\fR +\fIseconds\fR \fIkey\fR + +.SH DESCRIPTION +.PP +Tool to compute expires and signature values which can be used to upload +objects directly to the Swift from a browser by using the form POST middleware. + +.SH OPTIONS +.TP +.I path +The prefix to use for form uploaded +objects. For example: +\fI/v1/account/container/object_prefix_\fP would +ensure all form uploads have that path +prepended to the browser\-given file name. +.TP +.I redirect +The URL to redirect the browser to after +the uploads have completed. +.TP +.I max_file_size +The maximum file size per file uploaded. +.TP +.I max_file_count +The maximum number of uploaded files +allowed. +.TP +.I seconds +The number of seconds from now to allow +the form post to begin. +.TP +.I key +The X\-Account\-Meta\-Temp\-URL\-Key for the +account. + +.SH DOCUMENTATION +.LP +More in depth documentation in regards to +.BI swift\-form\-signature +and also about OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/ +and +.BI https://docs.openstack.org diff --git a/doc/manpages/swift-get-nodes.1 b/doc/manpages/swift-get-nodes.1 index d9409c58f5..73d1475ed2 100644 --- a/doc/manpages/swift-get-nodes.1 +++ b/doc/manpages/swift-get-nodes.1 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2010-2011 OpenStack, LLC. +.\" Copyright (c) 2010-2011 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. @@ -14,33 +14,61 @@ .\" implied. .\" See the License for the specific language governing permissions and .\" limitations under the License. -.\" -.TH swift-get-nodes 1 "8/26/2011" "Linux" "OpenStack Swift" +.\" +.TH swift-get-nodes 1 "10/25/2016" "Linux" "OpenStack Swift" -.SH NAME +.SH NAME .LP .B swift-get-nodes -\- Openstack-swift get-nodes tool +\- OpenStack Swift get-nodes tool .SH SYNOPSIS .LP -.B swift-get-nodes -\ [] [] - -.SH DESCRIPTION +.B swift-get-nodes +\ [options] [ []] + +Or + +.B swift-get-nodes +[options] -p + +Or + +.B swift-get-nodes +\ [options] -P policy_name + +.SH DESCRIPTION .PP The swift-get-nodes tool can be used to find out the location where -a particular account, container or object item is located within the -swift cluster nodes. For example, if you have the account hash and a container -name that belongs to that account, you can use swift-get-nodes to lookup +a particular account, container or object item is located within the +swift cluster nodes. For example, if you have the account hash and a container +name that belongs to that account, you can use swift-get-nodes to lookup where the container resides by using the container ring. 
+.SH OPTIONS +.TP +\fB\-h --help \fR +Shows the help message and exit +.TP +\fB\-a, --all\fR +Show all handoff nodes +.TP +\fB\-p PARTITION, --partition=PARTITION\fR +Show nodes for a given partition +.TP +\fB\-P POLICY_NAME, --policy-name=POLICY_NAME \fR +Specify storage policy name +.TP +\fB\-d SWIFT_DIR, --swift-dir=SWIFT_DIR\fR +Pass location of swift configuration file if different from the default +location /etc/swift + .RS 0 .IP "\fIExample:\fR" .RE .RS 4 -.PD 0 +.PD 0 .IP "$ swift-get-nodes /etc/swift/account.ring.gz MyAccount-12ac01446be2" .PD 0 @@ -51,28 +79,35 @@ where the container resides by using the container ring. .IP "Partition 221082" .IP "Hash d7e6ba68cfdce0f0e4ca7890e46cacce" -.IP "Server:Port Device 172.24.24.29:6002 sdd" -.IP "Server:Port Device 172.24.24.27:6002 sdr" -.IP "Server:Port Device 172.24.24.32:6002 sde" -.IP "Server:Port Device 172.24.24.26:6002 sdv [Handoff]" - -.IP "curl -I -XHEAD http://172.24.24.29:6002/sdd/221082/MyAccount-12ac01446be2" -.IP "curl -I -XHEAD http://172.24.24.27:6002/sdr/221082/MyAccount-12ac01446be2" -.IP "curl -I -XHEAD http://172.24.24.32:6002/sde/221082/MyAccount-12ac01446be2" -.IP "curl -I -XHEAD http://172.24.24.26:6002/sdv/221082/MyAccount-12ac01446be2 # [Handoff]" +.IP "Server:Port Device 172.24.24.29:6202 sdd" +.IP "Server:Port Device 172.24.24.27:6202 sdr" +.IP "Server:Port Device 172.24.24.32:6202 sde" +.IP "Server:Port Device 172.24.24.26:6202 sdv [Handoff]" + + +.IP "curl -I -XHEAD http://172.24.24.29:6202/sdd/221082/MyAccount-12ac01446be2" +.IP "curl -I -XHEAD http://172.24.24.27:6202/sdr/221082/MyAccount-12ac01446be2" +.IP "curl -I -XHEAD http://172.24.24.32:6202/sde/221082/MyAccount-12ac01446be2" +.IP "curl -I -XHEAD http://172.24.24.26:6202/sdv/221082/MyAccount-12ac01446be2 # [Handoff]" .IP "ssh 172.24.24.29 ls -lah /srv/node/sdd/accounts/221082/cce/d7e6ba68cfdce0f0e4ca7890e46cacce/ " -.IP "ssh 172.24.24.27 ls -lah /srv/node/sdr/accounts/221082/cce/d7e6ba68cfdce0f0e4ca7890e46cacce/" .IP "ssh 172.24.24.32 ls -lah /srv/node/sde/accounts/221082/cce/d7e6ba68cfdce0f0e4ca7890e46cacce/" .IP "ssh 172.24.24.26 ls -lah /srv/node/sdv/accounts/221082/cce/d7e6ba68cfdce0f0e4ca7890e46cacce/ # [Handoff] " -.PD -.RE +.IP "ssh 172.24.24.27 ls -lah /srv/node/sdr/accounts/221082/cce/d7e6ba68cfdce0f0e4ca7890e46cacce/" +.IP "ssh 172.24.24.32 ls -lah /srv/node/sde/accounts/221082/cce/d7e6ba68cfdce0f0e4ca7890e46cacce/" +.IP "ssh 172.24.24.26 ls -lah /srv/node/sdv/accounts/221082/cce/d7e6ba68cfdce0f0e4ca7890e46cacce/ # [Handoff] " + +.PD +.RE .SH DOCUMENTATION .LP -More documentation about Openstack-Swift can be found at -.BI http://swift.openstack.org/index.html +More documentation about OpenStack Swift can be found at +.BI https://docs.openstack.org/swift/latest/ .SH "SEE ALSO" + +.BR swift-account-info(1), +.BR swift-container-info(1), .BR swift-object-info(1), .BR swift-ring-builder(1) diff --git a/doc/manpages/swift-init.1 b/doc/manpages/swift-init.1 index 0d5431bfa0..c056e04fea 100644 --- a/doc/manpages/swift-init.1 +++ b/doc/manpages/swift-init.1 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2010-2011 OpenStack, LLC. +.\" Copyright (c) 2010-2011 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. @@ -14,25 +14,25 @@ .\" implied. .\" See the License for the specific language governing permissions and .\" limitations under the License. 
-.\" +.\" .TH swift-init 1 "8/26/2011" "Linux" "OpenStack Swift" -.SH NAME +.SH NAME .LP .B swift-init -\- Openstack-swift swift-init tool +\- OpenStack Swift swift-init tool .SH SYNOPSIS .LP .B swift-init [ ...] [options] - -.SH DESCRIPTION + +.SH DESCRIPTION .PP The swift-init tool can be used to initialize all swift daemons available as part of -openstack-swift. Instead of calling individual init scripts for each -swift daemon, one can just use swift-init. With swift-init you can initialize -just one swift service, such as the "proxy", or a combination of them. The tool also +OpenStack Swift. Instead of calling individual init scripts for each +swift daemon, one can just use swift-init. With swift-init you can initialize +just one swift service, such as the "proxy", or a combination of them. The tool also allows one to use the keywords such as "all", "main" and "rest" for the argument. @@ -41,17 +41,17 @@ allows one to use the keywords such as "all", "main" and "rest" for the .PD 0 .RS 4 .IP "\fIproxy\fR" "4" -.IP " - Initializes the swift proxy daemon" +.IP " - Initializes the swift proxy daemon" .RE .RS 4 .IP "\fIobject\fR, \fIobject-replicator\fR, \fIobject-auditor\fR, \fIobject-updater\fR" -.IP " - Initialize the swift object daemons above" +.IP " - Initializes the swift object daemons above" .RE .RS 4 .IP "\fIcontainer\fR, \fIcontainer-update\fR, \fIcontainer-replicator\fR, \fIcontainer-auditor\fR" -.IP " - Initialize the swift container daemons above" +.IP " - Initializes the swift container daemons above" .RE .RS 4 @@ -66,16 +66,16 @@ allows one to use the keywords such as "all", "main" and "rest" for the .RS 4 .IP "\fImain\fR" -.IP " - Initializes all the \fBmain\fR swift daemons " +.IP " - Initializes all the \fBmain\fR swift daemons" .IP " (proxy, container, account and object servers)" .RE .RS 4 .IP "\fIrest\fR" -.IP " - Initializes all the other \fBswift background daemons\fR such as" -.IP " (updater, replicator, auditor, reaper)" +.IP " - Initializes all the other \fBswift background daemons\fR" +.IP " (updater, replicator, auditor, reaper, etc)" .RE -.PD +.PD \fBCommands:\fR @@ -87,19 +87,20 @@ allows one to use the keywords such as "all", "main" and "rest" for the .IP "\fIno-wait\fR: \t\t\t spawn server and return immediately" .IP "\fIonce\fR: \t\t\t start server and run one pass on supporting daemons" .IP "\fIreload\fR: \t\t\t graceful shutdown then restart on supporting servers" +.IP "\fIreload-seamless\fR: \t\t reload supporting servers with no downtime" .IP "\fIrestart\fR: \t\t\t stops then restarts server" .IP "\fIshutdown\fR: \t\t allow current requests to finish on supporting servers" .IP "\fIstart\fR: \t\t\t starts a server" .IP "\fIstatus\fR: \t\t\t display status of tracked pids for server" .IP "\fIstop\fR: \t\t\t stops a server" -.PD +.PD .RE \fBOptions:\fR .RS 4 -.PD 0 +.PD 0 .IP "-h, --help \t\t\t show this help message and exit" .IP "-v, --verbose \t\t\t display verbose output" .IP "-w, --no-wait \t\t\t won't wait for server to start before returning @@ -107,14 +108,17 @@ allows one to use the keywords such as "all", "main" and "rest" for the .IP "-n, --no-daemon \t\t start server interactively .IP "-g, --graceful \t\t send SIGHUP to supporting servers .IP "-c N, --config-num=N \t send command to the Nth server only -.PD +.IP "-k N, --kill-wait=N \t wait N seconds for processes to die (default 15) +.IP "-r RUN_DIR, --run-dir=RUN_DIR directory where the pids will be stored (default /var/run/swift) +.IP "--strict return non-zero status code if some config is 
missing. Default mode if server is explicitly named." +.IP "--non-strict return zero status code even if some config is missing. Default mode if server is one of aliases `all`, `main` or `rest`." +.IP "--kill-after-timeout kill daemon and all children after kill-wait period." +.PD .RE - - -.SH DOCUMENTATION -.LP -More documentation about Openstack-Swift can be found at -.BI http://swift.openstack.org/index.html +.SH DOCUMENTATION +.LP +More documentation about OpenStack Swift can be found at +.BI https://docs.openstack.org/swift/latest/ diff --git a/doc/manpages/swift-object-auditor.1 b/doc/manpages/swift-object-auditor.1 index 5be922676c..999acc1825 100644 --- a/doc/manpages/swift-object-auditor.1 +++ b/doc/manpages/swift-object-auditor.1 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2010-2012 OpenStack, LLC. +.\" Copyright (c) 2010-2012 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. @@ -14,23 +14,23 @@ .\" implied. .\" See the License for the specific language governing permissions and .\" limitations under the License. -.\" +.\" .TH swift-object-auditor 1 "8/26/2011" "Linux" "OpenStack Swift" -.SH NAME +.SH NAME .LP -.B swift-object-auditor -\- Openstack-swift object auditor +.B swift-object-auditor +\- OpenStack Swift object auditor .SH SYNOPSIS .LP -.B swift-object-auditor +.B swift-object-auditor [CONFIG] [-h|--help] [-v|--verbose] [-o|--once] [-z|--zero_byte_fps] -.SH DESCRIPTION +.SH DESCRIPTION .PP -The object auditor crawls the local object system checking the integrity of objects. -If corruption is found (in the case of bit rot, for example), the file is +The object auditor crawls the local object system checking the integrity of objects. +If corruption is found (in the case of bit rot, for example), the file is quarantined, and replication will replace the bad file from another replica. The options are as follows: @@ -46,7 +46,7 @@ The options are as follows: .IP "-o" .IP "--once" .RS 4 -.IP "only run one pass of daemon" +.IP "only run one pass of daemon" .RE .IP "-z ZERO_BYTE_FPS" @@ -56,14 +56,14 @@ The options are as follows: .RE .PD .RE - - + + .SH DOCUMENTATION .LP -More in depth documentation in regards to -.BI swift-object-auditor -and also about Openstack-Swift as a whole can be found at -.BI http://swift.openstack.org/index.html +More in depth documentation in regards to +.BI swift-object-auditor +and also about OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/ .SH "SEE ALSO" diff --git a/doc/manpages/swift-object-expirer.1 b/doc/manpages/swift-object-expirer.1 index 24e1cbb05c..0615f9f99f 100644 --- a/doc/manpages/swift-object-expirer.1 +++ b/doc/manpages/swift-object-expirer.1 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2012 OpenStack, LLC. +.\" Copyright (c) 2012 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. @@ -14,31 +14,31 @@ .\" implied. .\" See the License for the specific language governing permissions and .\" limitations under the License. 
-.\" +.\" .TH swift-object-expirer 1 "3/15/2012" "Linux" "OpenStack Swift" -.SH NAME +.SH NAME .LP .B swift-object-expirer -\- Openstack-swift object expirer +\- OpenStack Swift object expirer .SH SYNOPSIS .LP -.B swift-object-expirer +.B swift-object-expirer [CONFIG] [-h|--help] [-v|--verbose] [-o|--once] -.SH DESCRIPTION +.SH DESCRIPTION .PP -The swift-object-expirer offers scheduled deletion of objects. The Swift client would -use the X-Delete-At or X-Delete-After headers during an object PUT or POST and the -cluster would automatically quit serving that object at the specified time and would +The swift-object-expirer offers scheduled deletion of objects. The Swift client would +use the X-Delete-At or X-Delete-After headers during an object PUT or POST and the +cluster would automatically quit serving that object at the specified time and would shortly thereafter remove the object from the system. -The X-Delete-At header takes a Unix Epoch timestamp, in integer form; for example: +The X-Delete-At header takes a Unix Epoch timestamp, in integer form; for example: 1317070737 represents Mon Sep 26 20:58:57 2011 UTC. -The X-Delete-After header takes a integer number of seconds. The proxy server -that receives the request will convert this header into an X-Delete-At header +The X-Delete-After header takes an integer number of seconds. The proxy server +that receives the request will convert this header into an X-Delete-At header using its current time plus the value given. The options are as follows: @@ -53,22 +53,23 @@ The options are as follows: .IP "-o" .IP "--once" .RS 4 -.IP "only run one pass of daemon" +.IP "only run one pass of daemon" .RE .PD .RE - - + + .SH DOCUMENTATION .LP -More in depth documentation in regards to +More in depth documentation in regards to .BI swift-object-expirer -can be foud at -.BI http://swift.openstack.org/overview_expiring_objects.html -and also about Openstack-Swift as a whole can be found at -.BI http://swift.openstack.org/index.html +can be found at +.BI https://docs.openstack.org/swift/latest/overview_expiring_objects.html +and also about OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/ .SH "SEE ALSO" +.BR object-server.conf(5) .BR object-expirer.conf(5) diff --git a/doc/manpages/swift-object-info.1 b/doc/manpages/swift-object-info.1 index fe38638b03..be7e6e51f6 100644 --- a/doc/manpages/swift-object-info.1 +++ b/doc/manpages/swift-object-info.1 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2010-2011 OpenStack, LLC. +.\" Copyright (c) 2010-2011 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. @@ -14,42 +14,60 @@ .\" implied. .\" See the License for the specific language governing permissions and .\" limitations under the License. -.\" -.TH swift-object-info 1 "8/26/2011" "Linux" "OpenStack Swift" +.\" +.TH swift-object-info 1 "10/25/2016" "Linux" "OpenStack Swift" -.SH NAME +.SH NAME .LP .B swift-object-info -\- Openstack-swift object-info tool +\- OpenStack Swift object-info tool .SH SYNOPSIS .LP .B swift-object-info -[OBJECT_FILE] + [options] -.SH DESCRIPTION +.SH DESCRIPTION .PP -This is a very simple swift tool that allows a swiftop engineer to retrieve -information about an object that is located on the storage node. One calls -the tool with a given object file as it is stored on the storage node system. 
-It will then return several information about that object such as; +This is a very simple swift tool that allows a swiftop engineer to retrieve +information about an object that is located on the storage node. One calls +the tool with a given object file as it is stored on the storage node system. +It will then return several information about that object such as; .PD 0 -.IP "- Account it belongs to" +.IP "- Account it belongs to" .IP "- Container " .IP "- Object hash " -.IP "- Location on the ring " .IP "- Content Type " .IP "- timestamp " .IP "- Etag " .IP "- Content Length " .IP "- User Metadata " -.PD - +.IP "- Location on the ring " +.PD + +.SH OPTIONS +.TP +\fB\-h --help \fR +Shows the help message and exit +.TP +\fB\-n, --no-check-etag\fR +Don't verify file contents against stored etag +.TP +\fB\-d SWIFT_DIR, --swift-dir=SWIFT_DIR\fR +Pass location of swift configuration file if different from the default +location /etc/swift +.TP +\fB\-P POLICY_NAME, --policy-name=POLICY_NAME \fR +Specify storage policy name + .SH DOCUMENTATION .LP -More documentation about Openstack-Swift can be found at -.BI http://swift.openstack.org/index.html +More documentation about OpenStack Swift can be found at +.BI https://docs.openstack.org/swift/latest/ .SH "SEE ALSO" -.BR swift-get-nodes(1), + +.BR swift-account-info(1), +.BR swift-container-info(1), +.BR swift-get-nodes(1) diff --git a/doc/manpages/swift-object-reconstructor.1 b/doc/manpages/swift-object-reconstructor.1 new file mode 100644 index 0000000000..3877d8eaf1 --- /dev/null +++ b/doc/manpages/swift-object-reconstructor.1 @@ -0,0 +1,61 @@ +.\" +.\" Copyright (c) 2016 OpenStack Foundation. +.\" +.\" Licensed under the Apache License, Version 2.0 (the "License"); +.\" you may not use this file except in compliance with the License. +.\" You may obtain a copy of the License at +.\" +.\" http://www.apache.org/licenses/LICENSE-2.0 +.\" +.\" Unless required by applicable law or agreed to in writing, software +.\" distributed under the License is distributed on an "AS IS" BASIS, +.\" WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +.\" implied. +.\" See the License for the specific language governing permissions and +.\" limitations under the License. +.\" +.TH SWIFT-OBJECT-RECONSTRUCTOR "1" "August 2016" "OpenStack Swift" + +.SH NAME +swift\-object\-reconstructor \- OpenStack Swift EC object reconstructor + +.SH SYNOPSIS +.B swift\-object\-reconstructor +\fICONFIG \fR[\fIoptions\fR] + +.SH DESCRIPTION +.PP +Daemon for reconstruction of EC objects. Once a pair of nodes has +determined the need to replace a missing object fragment, instead of +pushing over a copy like replication would do, the reconstructor has to +read in enough surviving fragments from other nodes and perform a local +reconstruction before it has the correct data to push to the other node. + +.SH OPTIONS +.TP +\fB\-h\fR, \fB\-\-help\fR +Show this help message and exit +.TP +\fB\-d\fR \fIDEVICES\fR, \fB\-\-devices\fR=\fIDEVICES\fR +Reconstruct only given devices. Comma\-separated list. Only has effect if +\-\-once is used. +.TP +\fB\-p\fR \fIPARTITIONS\fR, \fB\-\-partitions\fR=\fIPARTITIONS\fR +Reconstruct only given partitions. Comma\-separated +list. Only has effect if \-\-once is used. 
+.TP +\fB\-v\fR, \fB\-\-verbose\fR +Log to console +.TP +\fB\-o\fR, \fB\-\-once\fR +Only run one pass of daemon +.PP + +.SH DOCUMENTATION +.LP +More in depth documentation in regards to +.BI swift\-object\-reconstructor +and also about OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/ +and +.BI https://docs.openstack.org diff --git a/doc/manpages/swift-object-relinker.1 b/doc/manpages/swift-object-relinker.1 new file mode 100644 index 0000000000..8b42a6fc5e --- /dev/null +++ b/doc/manpages/swift-object-relinker.1 @@ -0,0 +1,75 @@ +.\" +.\" Copyright (c) 2017 OpenStack Foundation. +.\" +.\" Licensed under the Apache License, Version 2.0 (the "License"); +.\" you may not use this file except in compliance with the License. +.\" You may obtain a copy of the License at +.\" +.\" http://www.apache.org/licenses/LICENSE-2.0 +.\" +.\" Unless required by applicable law or agreed to in writing, software +.\" distributed under the License is distributed on an "AS IS" BASIS, +.\" WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +.\" implied. +.\" See the License for the specific language governing permissions and +.\" limitations under the License. +.\" +.TH SWIFT-OBJECT-RELINKER "1" "December 2017" "OpenStack Swift" + +.SH NAME +\fBswift\-object\-relinker\fR \- relink and cleanup objects to increase partition power +.SH SYNOPSIS +.B swift\-object\-relinker +[\fIoptions\fR] <\fIcommand\fR> + +.SH DESCRIPTION +.PP +The relinker prepares an object server's filesystem for a partition power +change by crawling the filesystem and linking existing objects to future +partition directories. + +More information can be found at +.BI https://docs.openstack.org/swift/latest/ring_partpower.html + +.SH COMMANDS +.TP +\fBrelink\fR +Relink files for partition power increase. + +.TP +\fBcleanup\fR +Remove hard links in the old locations. + +.SH OPTIONS +.TP +\fB\-h\fR, \fB\-\-help\fR +Show this help message and exit + +.TP +\fB\-\-swift-dir\fR \fISWIFT_DIR\fR +Path to swift directory + +.TP +\fB\-\-devices\fR \fIDEVICES\fR +Path to swift device directory + +.TP +\fB\-\-skip\-mount\-check\fR +Don't test if disk is mounted + +.TP +\fB\-\-logfile\fR \fILOGFILE\fR +Set log file name + +.TP +\fB\-\-debug\fR +Enable debug mode + +.SH DOCUMENTATION +.LP +More in depth documentation in regards to +.BI swift\-object\-relinker +and also about OpenStack Swift as a whole can be found at +.BI http://docs.openstack.org/developer/swift/index.html +and +.BI http://docs.openstack.org diff --git a/doc/manpages/swift-object-replicator.1 b/doc/manpages/swift-object-replicator.1 index 71c0383aa2..62eae6990b 100644 --- a/doc/manpages/swift-object-replicator.1 +++ b/doc/manpages/swift-object-replicator.1 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2010-2012 OpenStack, LLC. +.\" Copyright (c) 2010-2012 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. @@ -14,57 +14,64 @@ .\" implied. .\" See the License for the specific language governing permissions and .\" limitations under the License. 
-.\" +.\" .TH swift-object-replicator 1 "8/26/2011" "Linux" "OpenStack Swift" -.SH NAME +.SH NAME .LP -.B swift-object-replicator -\- Openstack-swift object replicator +.B swift-object-replicator +\- OpenStack Swift object replicator .SH SYNOPSIS .LP -.B swift-object-replicator +.B swift-object-replicator [CONFIG] [-h|--help] [-v|--verbose] [-o|--once] -.SH DESCRIPTION +.SH DESCRIPTION .PP -Replication is designed to keep the system in a consistent state in the face of -temporary error conditions like network outages or drive failures. The replication -processes compare local data with each remote copy to ensure they all contain the -latest version. Object replication uses a hash list to quickly compare subsections +Replication is designed to keep the system in a consistent state in the face of +temporary error conditions like network outages or drive failures. The replication +processes compare local data with each remote copy to ensure they all contain the +latest version. Object replication uses a hash list to quickly compare subsections of each partition. .PP -Replication updates are push based. For object replication, updating is just a matter +Replication updates are push based. For object replication, updating is just a matter of rsyncing files to the peer. The replicator also ensures that data is removed -from the system. When an object item is deleted a tombstone is set as the latest -version of the item. The replicator will see the tombstone and ensure that the item +from the system. When an object item is deleted a tombstone is set as the latest +version of the item. The replicator will see the tombstone and ensure that the item is removed from the entire system. -The options are as follows: +.SH OPTIONS +.TP +\fB\-h\fR, \fB\-\-help\fR +Show this help message and exit +.TP +\fB\-d\fR \fIDEVICES\fR, \fB\-\-devices\fR=\fIDEVICES\fR +Replicate only given devices. Comma\-separated list. Only has effect if +\-\-once is used. +.TP +\fB\-p\fR \fIPARTITIONS\fR, \fB\-\-partitions\fR=\fIPARTITIONS\fR +Replicate only given partitions. Comma\-separated +list. Only has effect if \-\-once is used. +.TP +\fB\-i\fR \fIPOLICIES\fR, \fB\-\-policies\fR=\fIPOLICIES\fR +Replicate only given policy indices. Comma\-separated list. Only has effect if +\-\-once is used. +.TP +\fB\-v\fR, \fB\-\-verbose\fR +Log to console +.TP +\fB\-o\fR, \fB\-\-once\fR +Only run one pass of daemon +.PP + -.RS 4 -.PD 0 -.IP "-v" -.IP "--verbose" -.RS 4 -.IP "log to console" -.RE -.IP "-o" -.IP "--once" -.RS 4 -.IP "only run one pass of daemon" -.RE -.PD -.RE - - .SH DOCUMENTATION .LP -More in depth documentation in regards to +More in depth documentation in regards to .BI swift-object-replicator -and also about Openstack-Swift as a whole can be found at -.BI http://swift.openstack.org/index.html +and also about OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/ .SH "SEE ALSO" diff --git a/doc/manpages/swift-object-server.1 b/doc/manpages/swift-object-server.1 index e3d0d34693..76632a9313 100644 --- a/doc/manpages/swift-object-server.1 +++ b/doc/manpages/swift-object-server.1 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2010-2011 OpenStack, LLC. +.\" Copyright (c) 2010-2011 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. @@ -14,40 +14,40 @@ .\" implied. 
.\" See the License for the specific language governing permissions and .\" limitations under the License. -.\" +.\" .TH swift-object-server 1 "8/26/2011" "Linux" "OpenStack Swift" -.SH NAME +.SH NAME .LP .B swift-object-server -\- Openstack-swift object server. +\- OpenStack Swift object server. .SH SYNOPSIS .LP .B swift-object-server [CONFIG] [-h|--help] [-v|--verbose] -.SH DESCRIPTION +.SH DESCRIPTION .PP The Object Server is a very simple blob storage server that can store, retrieve -and delete objects stored on local devices. Objects are stored as binary files +and delete objects stored on local devices. Objects are stored as binary files on the filesystem with metadata stored in the file's extended attributes (xattrs). -This requires that the underlying filesystem choice for object servers support -xattrs on files. Some filesystems, like ext3, have xattrs turned off by default. +This requires that the underlying filesystem choice for object servers support +xattrs on files. Some filesystems, like ext3, have xattrs turned off by default. Each object is stored using a path derived from the object name's hash and the operation's timestamp. Last write always wins, and ensures that the latest object version will be served. A deletion is also treated as a version of the file (a 0 byte file ending with -".ts", which stands for tombstone). This ensures that deleted files are replicated +".ts", which stands for tombstone). This ensures that deleted files are replicated correctly and older versions don't magically reappear due to failure scenarios. .SH DOCUMENTATION .LP -More in depth documentation in regards to +More in depth documentation in regards to .BI swift-object-server -and also about Openstack-Swift as a whole can be found at -.BI http://swift.openstack.org/index.html -and -.BI http://docs.openstack.org +and also about OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/ +and +.BI https://docs.openstack.org .SH "SEE ALSO" diff --git a/doc/manpages/swift-object-updater.1 b/doc/manpages/swift-object-updater.1 index 254b3499ba..da175674e2 100644 --- a/doc/manpages/swift-object-updater.1 +++ b/doc/manpages/swift-object-updater.1 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2010-2012 OpenStack, LLC. +.\" Copyright (c) 2010-2012 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. @@ -14,36 +14,36 @@ .\" implied. .\" See the License for the specific language governing permissions and .\" limitations under the License. -.\" +.\" .TH swift-object-updater 1 "8/26/2011" "Linux" "OpenStack Swift" -.SH NAME +.SH NAME .LP .B swift-object-updater -\- Openstack-swift object updater +\- OpenStack Swift object updater .SH SYNOPSIS .LP .B swift-object-updater [CONFIG] [-h|--help] [-v|--verbose] [-o|--once] -.SH DESCRIPTION +.SH DESCRIPTION .PP -The object updater is responsible for updating object information in container listings. -It will check to see if there are any locally queued updates on the filesystem of each -devices, what is also known as async pending file(s), walk each one and update the +The object updater is responsible for updating object information in container listings. +It will check to see if there are any locally queued updates on the filesystem of each +devices, what is also known as async pending file(s), walk each one and update the container listing. 
-For example, suppose a container server is under load and a new object is put -into the system. The object will be immediately available for reads as soon as -the proxy server responds to the client with success. However, the object -server has not been able to update the object listing in the container server. -Therefore, the update would be queued locally for a later update. Container listings, +For example, suppose a container server is under load and a new object is put +into the system. The object will be immediately available for reads as soon as +the proxy server responds to the client with success. However, the object +server has not been able to update the object listing in the container server. +Therefore, the update would be queued locally for a later update. Container listings, therefore, may not immediately contain the object. This is where an eventual consistency -window will most likely come in to play. +window will most likely come in to play. -In practice, the consistency window is only as large as the frequency at which -the updater runs and may not even be noticed as the proxy server will route +In practice, the consistency window is only as large as the frequency at which +the updater runs and may not even be noticed as the proxy server will route listing requests to the first container server which responds. The server under load may not be the one that serves subsequent listing requests – one of the other two replicas may handle the listing. @@ -60,18 +60,18 @@ The options are as follows: .IP "-o" .IP "--once" .RS 4 -.IP "only run one pass of daemon" +.IP "only run one pass of daemon" .RE -.PD +.PD .RE - - + + .SH DOCUMENTATION .LP -More in depth documentation in regards to +More in depth documentation in regards to .BI swift-object-updater -and also about Openstack-Swift as a whole can be found at -.BI http://swift.openstack.org/index.html +and also about OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/ .SH "SEE ALSO" diff --git a/doc/manpages/swift-oldies.1 b/doc/manpages/swift-oldies.1 new file mode 100644 index 0000000000..4266f42df9 --- /dev/null +++ b/doc/manpages/swift-oldies.1 @@ -0,0 +1,69 @@ +.\" +.\" Author: Paul Dardeau +.\" Copyright (c) 2016 OpenStack Foundation. +.\" +.\" Licensed under the Apache License, Version 2.0 (the "License"); +.\" you may not use this file except in compliance with the License. +.\" You may obtain a copy of the License at +.\" +.\" http://www.apache.org/licenses/LICENSE-2.0 +.\" +.\" Unless required by applicable law or agreed to in writing, software +.\" distributed under the License is distributed on an "AS IS" BASIS, +.\" WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +.\" implied. +.\" See the License for the specific language governing permissions and +.\" limitations under the License. +.\" +.TH swift-oldies 1 "8/04/2016" "Linux" "OpenStack Swift" + +.SH NAME +.LP +.B swift-oldies +\- OpenStack Swift oldies tool + +.SH SYNOPSIS +.LP +.B swift-oldies +[-h|--help] [-a|--age] + + +.SH DESCRIPTION +.PP +Lists Swift processes that have been running more than a specific length of +time (in hours). This is done by scanning the list of currently executing +processes (via ps command) and examining the execution time of those python +processes whose program names begin with 'swift-'. 
+ +Example (see all Swift processes older than two days): +swift-oldies \-a 48 + +The options are as follows: + +.RS 4 +.PD 0 +.IP "-a HOURS" +.IP "--age=HOURS" +.RS 4 +.IP "Look for processes at least HOURS old; default: 720 (30 days)" +.RE +.PD 0 + +.IP "-h" +.IP "--help" +.RS 4 +.IP "Display program help and exit" +.PD +.RE + + +.SH DOCUMENTATION +.LP +More documentation about OpenStack Swift can be found at +.BI https://docs.openstack.org/swift/latest/ + + +.SH "SEE ALSO" + +.BR swift-orphans(1) + diff --git a/doc/manpages/swift-orphans.1 b/doc/manpages/swift-orphans.1 index b4b6158bdc..e39513b614 100644 --- a/doc/manpages/swift-orphans.1 +++ b/doc/manpages/swift-orphans.1 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2012 OpenStack, LLC. +.\" Copyright (c) 2012 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. @@ -14,30 +14,31 @@ .\" implied. .\" See the License for the specific language governing permissions and .\" limitations under the License. -.\" +.\" .TH swift-orphans 1 "3/15/2012" "Linux" "OpenStack Swift" -.SH NAME +.SH NAME .LP .B swift-orphans -\- Openstack-swift orphans tool +\- OpenStack Swift orphans tool .SH SYNOPSIS .LP -.B swift-orphans -[-h|--help] [-a|--age] [-k|--kill] [-w|--wide] +.B swift-orphans +[-h|--help] [-a|--age] [-k|--kill] [-w|--wide] [-r|--run-dir] -.SH DESCRIPTION +.SH DESCRIPTION .PP Lists and optionally kills orphaned Swift processes. This is done by scanning -/var/run/swift for .pid files and listing any processes that look like Swift -processes but aren't associated with the pids in those .pid files. Any Swift -processes running with the 'once' parameter are ignored, as those are usually -for full-speed audit scans and such. +/var/run/swift or the directory specified to the \-r switch for .pid files and +listing any processes that look like Swift processes but aren't associated with +the pids in those .pid files. Any Swift processes running with the 'once' +parameter are ignored, as those are usually for full-speed audit scans and +such. -Example (sends SIGTERM to all orphaned Swift processes older than two hours): -swift-orphans -a 2 -k TERM +Example (sends SIGTERM to all orphaned Swift processes older than two hours): +swift-orphans \-a 2 \-k TERM The options are as follows: @@ -61,9 +62,9 @@ The options are as follows: .PD .RE - + .SH DOCUMENTATION .LP -More documentation about Openstack-Swift can be found at -.BI http://swift.openstack.org/index.html +More documentation about OpenStack Swift can be found at +.BI https://docs.openstack.org/swift/latest/ diff --git a/doc/manpages/swift-proxy-server.1 b/doc/manpages/swift-proxy-server.1 index 2a4b6c36f4..790d3fda05 100644 --- a/doc/manpages/swift-proxy-server.1 +++ b/doc/manpages/swift-proxy-server.1 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2010-2011 OpenStack, LLC. +.\" Copyright (c) 2010-2011 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. @@ -14,36 +14,36 @@ .\" implied. .\" See the License for the specific language governing permissions and .\" limitations under the License. -.\" +.\" .TH swift-proxy-server 1 "8/26/2011" "Linux" "OpenStack Swift" -.SH NAME +.SH NAME .LP -.B swift-proxy-server -\- Openstack-swift proxy server. +.B swift-proxy-server +\- OpenStack Swift proxy server. 
.SH SYNOPSIS .LP .B swift-proxy-server [CONFIG] [-h|--help] [-v|--verbose] -.SH DESCRIPTION +.SH DESCRIPTION .PP -The Swift Proxy Server is responsible for tying together the rest of the Swift architecture. -For each request, it will look up the location of the account, container, or object in the -ring and route the request accordingly. The public API is also exposed through the Proxy -Server. A large number of failures are also handled in the Proxy Server. For example, +The Swift Proxy Server is responsible for tying together the rest of the Swift architecture. +For each request, it will look up the location of the account, container, or object in the +ring and route the request accordingly. The public API is also exposed through the Proxy +Server. A large number of failures are also handled in the Proxy Server. For example, if a server is unavailable for an object PUT, it will ask the ring for a handoff server and route there instead. When objects are streamed to or from an object server, they are -streamed directly through the proxy server to or from the user the proxy server does +streamed directly through the proxy server to or from the user the proxy server does not spool them. .SH DOCUMENTATION .LP -More in depth documentation in regards to +More in depth documentation in regards to .BI swift-proxy-server -and also about Openstack-Swift as a whole can be found at -.BI http://swift.openstack.org/index.html +and also about OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/ .SH "SEE ALSO" diff --git a/doc/manpages/swift-recon-cron.1 b/doc/manpages/swift-recon-cron.1 new file mode 100644 index 0000000000..8ebbcb2c29 --- /dev/null +++ b/doc/manpages/swift-recon-cron.1 @@ -0,0 +1,38 @@ +.\" +.\" Copyright (c) 2016 OpenStack Foundation. +.\" +.\" Licensed under the Apache License, Version 2.0 (the "License"); +.\" you may not use this file except in compliance with the License. +.\" You may obtain a copy of the License at +.\" +.\" http://www.apache.org/licenses/LICENSE-2.0 +.\" +.\" Unless required by applicable law or agreed to in writing, software +.\" distributed under the License is distributed on an "AS IS" BASIS, +.\" WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +.\" implied. +.\" See the License for the specific language governing permissions and +.\" limitations under the License. +.\" +.TH SWIFT-RECON-CRON "1" "August 2016" "OpenStack Swift" + +.SH NAME +swift\-recon\-cron \- OpenStack Swift recon cron job + +.SH SYNOPSIS +.B swift\-recon\-cron +\fI\fR + +.SH DESCRIPTION +.PP +Tool that can be run by using cron to fill recon cache. Recon data +can be read by \fBswift-recon\fR tool. + +.SH DOCUMENTATION +.LP +More in depth documentation in regards to +.BI swift\-recon\-cron +and also about OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/ +and +.BI https://docs.openstack.org diff --git a/doc/manpages/swift-recon.1 b/doc/manpages/swift-recon.1 index a9745c28da..dc5a19d002 100644 --- a/doc/manpages/swift-recon.1 +++ b/doc/manpages/swift-recon.1 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2010-2011 OpenStack, LLC. +.\" Copyright (c) 2010-2011 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. @@ -14,26 +14,26 @@ .\" implied. .\" See the License for the specific language governing permissions and .\" limitations under the License. 
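swift-recon-cron is typically driven from cron; the entry below mirrors the crontab line shown in the swift-recon(1) EXAMPLE section further on:

    */5 * * * * swift /usr/bin/swift-recon-cron /etc/swift/object-server.conf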
-.\" +.\" .TH swift-recon 1 "8/26/2011" "Linux" "OpenStack Swift" -.SH NAME +.SH NAME .LP .B swift-recon -\- Openstack-swift recon middleware cli tool +\- OpenStack Swift recon middleware cli tool .SH SYNOPSIS .LP -.B swift-recon -\ [-v] [--suppress] [-a] [-r] [-u] [-d] [-l] [--md5] [--auditor] [--updater] [--expirer] [--sockstat] - -.SH DESCRIPTION +.B swift-recon +\ [-v] [--suppress] [-a] [-r] [-u] [-d] [-l] [-T] [--md5] [--auditor] [--updater] [--expirer] [--sockstat] + +.SH DESCRIPTION .PP The swift-recon cli tool can be used to retrieve various metrics and telemetry information about -a cluster that has been collected by the swift-recon middleware. +a cluster that has been collected by the swift-recon middleware. -In order to make use of the swift-recon middleware, update the object-server.conf file and -enable the recon middleware by adding a pipeline entry and setting its option(s). You can view +In order to make use of the swift-recon middleware, update the object-server.conf file and +enable the recon middleware by adding a pipeline entry and setting its option(s). You can view more information in the example section below. @@ -58,24 +58,48 @@ Get updater stats Get expirer stats .IP "\fB-r, --replication\fR" Get replication stats +.IP "\fB-R, --reconstruction\fR" +Get reconstruction stats .IP "\fB-u, --unmounted\fR" Check cluster for unmounted devices .IP "\fB-d, --diskusage\fR" Get disk usage stats +.IP "\fB--top=COUNT\fR" +Also show the top COUNT entries in rank order +.IP "\fB--lowest=COUNT\fR" +Also show the lowest COUNT entries in rank order +.IP "\fB--human-readable\fR" +Use human readable suffix for disk usage stats .IP "\fB-l, --loadstats\fR" Get cluster load average stats .IP "\fB-q, --quarantined\fR" Get cluster quarantine stats +.IP "\fB--validate-servers\fR" +Validate servers on the ring .IP "\fB--md5\fR" -Get md5sum of servers ring and compare to local cop +Get md5sum of servers ring and compare to local copy +.IP "\fB--sockstat\fR" +Get cluster socket usage stats +.IP "\fB--driveaudit\fR" +Get drive audit error stats +.IP "\fB-T, --time\fR" +Check time synchronization +.IP "\fB--swift-versions\fR" +Check swift version .IP "\fB--all\fR" -Perform all checks. Equivalent to -arudlq --md5 +Perform all checks. Equivalent to \-arudlqT +\-\-md5 \-\-sockstat \-\-auditor \-\-updater \-\-expirer +\-\-driveaudit \-\-validate\-servers \-\-swift-versions +.IP "\fB--region=REGION\fR" +Only query servers in specified region .IP "\fB-z ZONE, --zone=ZONE\fR" Only query servers in specified zone +.IP "\fB-t SECONDS, --timeout=SECONDS\fR" +Time to wait for a response from a server .IP "\fB--swiftdir=PATH\fR" Default = /etc/swift .PD -.RE +.RE @@ -84,16 +108,16 @@ Default = /etc/swift .PD 0 .RS 0 .IP "ubuntu:~$ swift-recon -q --zone 3" -.IP "===============================================================================" +.IP "=================================================================" .IP "[2011-10-18 19:36:00] Checking quarantine dirs on 1 hosts... 
" .IP "[Quarantined objects] low: 4, high: 4, avg: 4, total: 4 " .IP "[Quarantined accounts] low: 0, high: 0, avg: 0, total: 0 " .IP "[Quarantined containers] low: 0, high: 0, avg: 0, total: 0 " -.IP "===============================================================================" +.IP "=================================================================" .RE .RS 0 -Finally if you also wish to track asynchronous pending’s you will need to setup a +Finally if you also wish to track asynchronous pending's you will need to setup a cronjob to run the swift-recon-cron script periodically: .IP "*/5 * * * * swift /usr/bin/swift-recon-cron /etc/swift/object-server.conf" @@ -104,10 +128,10 @@ cronjob to run the swift-recon-cron script periodically: .SH DOCUMENTATION .LP -More documentation about Openstack-Swift can be found at -.BI http://swift.openstack.org/index.html -Also more specific documentation about swift-recon can be found at -.BI http://swift.openstack.org/admin_guide.html#cluster-telemetry-and-monitoring +More documentation about OpenStack Swift can be found at +.BI https://docs.openstack.org/swift/latest/ +Also more specific documentation about swift-recon can be found at +.BI https://docs.openstack.org/swift/latest/admin_guide.html\#cluster-telemetry-and-monitoring diff --git a/doc/manpages/swift-reconciler-enqueue.1 b/doc/manpages/swift-reconciler-enqueue.1 new file mode 100644 index 0000000000..fe9c3db1fc --- /dev/null +++ b/doc/manpages/swift-reconciler-enqueue.1 @@ -0,0 +1,58 @@ +.\" +.\" Copyright (c) 2016 OpenStack Foundation. +.\" +.\" Licensed under the Apache License, Version 2.0 (the "License"); +.\" you may not use this file except in compliance with the License. +.\" You may obtain a copy of the License at +.\" +.\" http://www.apache.org/licenses/LICENSE-2.0 +.\" +.\" Unless required by applicable law or agreed to in writing, software +.\" distributed under the License is distributed on an "AS IS" BASIS, +.\" WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +.\" implied. +.\" See the License for the specific language governing permissions and +.\" limitations under the License. +.\" +.TH SWIFT-RECONCILER-ENQUEUE "1" "August 2016" "OpenStack Swift" + +.SH NAME +swift\-reconciler\-enqueue \- OpenStack Swift reconciler enqueue +.SH SYNOPSIS +.B swift\-reconciler\-enqueue +\fIpolicy_index\fR \fI/a/c/o\fR \fItimestamp\fR \fR[\fIoptions\fR] + +.SH DESCRIPTION +.PP +This script enqueues an object to be evaluated by the reconciler. + +.SH OPTIONS +.TP +\fIpolicy_index\fR +The policy the object is currently stored in. +.TP +\fI/a/c/o\fR +The full path of the object \- UTF\-8 +.TP +\fItimestamp\fR +The timestamp of the datafile/tombstone. + +.TP +\fB\-h\fR, \fB\-\-help\fR +Show this help message and exit +.TP +\fB\-X\fR \fIOP\fR, \fB\-\-op\fR=\fIOP\fR +The method of the misplaced operation +.TP +\fB\-f\fR, \fB\-\-force\fR +Force an object to be re\-enqueued +.PP + +.SH DOCUMENTATION +.LP +More in depth documentation in regards to +.BI swift\-reconciler\-enqueue +and also about OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/ +and +.BI https://docs.openstack.org diff --git a/doc/manpages/swift-ring-builder-analyzer.1 b/doc/manpages/swift-ring-builder-analyzer.1 new file mode 100644 index 0000000000..6ced40416e --- /dev/null +++ b/doc/manpages/swift-ring-builder-analyzer.1 @@ -0,0 +1,52 @@ +.\" +.\" Copyright (c) 2016 OpenStack Foundation. 
+.\" +.\" Licensed under the Apache License, Version 2.0 (the "License"); +.\" you may not use this file except in compliance with the License. +.\" You may obtain a copy of the License at +.\" +.\" http://www.apache.org/licenses/LICENSE-2.0 +.\" +.\" Unless required by applicable law or agreed to in writing, software +.\" distributed under the License is distributed on an "AS IS" BASIS, +.\" WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +.\" implied. +.\" See the License for the specific language governing permissions and +.\" limitations under the License. +.\" +.TH SWIFT-RING-BUILDER-ANALYZER "1" "August 2016" "OpenStack Swift" + +.SH NAME +swift\-ring\-builder\-analyzer \- put the OpenStack Swift ring builder through its paces +.SH SYNOPSIS +.B swift\-ring\-builder\-analyzer +[\fIoptions\fR] \fIscenario_path\fR + +.SH DESCRIPTION +.PP +This is a tool to help developers quantify changes to the ring +builder. It takes a scenario (JSON file) describing the builder's +basic parameters (part_power, replicas, etc.) and a number of +"rounds", where each round is a set of operations to perform on the +builder. For each round, the operations are applied, and then the +builder is rebalanced until it reaches a steady state. + +.SH OPTIONS +.TP +.I scenario_path +Path to the scenario file +.TP +\fB\-h\fR, \fB\-\-help\fR +Show this help message and exit +.TP +\fB\-\-check\fR, \fB\-c\fR +Just check the scenario, don't execute it. + +.SH DOCUMENTATION +.LP +More in depth documentation in regards to +.BI swift\-ring\-builder\-analyzer +and also about OpenStack Swift as a whole can be found at +.BI https://docs.openstack.org/swift/latest/ +and +.BI https://docs.openstack.org diff --git a/doc/manpages/swift-ring-builder.1 b/doc/manpages/swift-ring-builder.1 index c8433e8ddf..ac6bb7a1af 100644 --- a/doc/manpages/swift-ring-builder.1 +++ b/doc/manpages/swift-ring-builder.1 @@ -1,6 +1,6 @@ .\" .\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2010-2011 OpenStack, LLC. +.\" Copyright (c) 2010-2011 OpenStack Foundation. .\" .\" Licensed under the Apache License, Version 2.0 (the "License"); .\" you may not use this file except in compliance with the License. @@ -14,26 +14,26 @@ .\" implied. .\" See the License for the specific language governing permissions and .\" limitations under the License. -.\" +.\" .TH swift-ring-builder 1 "8/26/2011" "Linux" "OpenStack Swift" -.SH NAME +.SH NAME .LP .B swift-ring-builder -\- Openstack-swift ring builder +\- OpenStack Swift ring builder .SH SYNOPSIS .LP .B swift-ring-builder <...> -.SH DESCRIPTION +.SH DESCRIPTION .PP -The swift-ring-builder utility is used to create, search and manipulate -the swift storage ring. The ring-builder assigns partitions to devices and +The swift-ring-builder utility is used to create, search and manipulate +the swift storage ring. The ring-builder assigns partitions to devices and writes an optimized Python structure to a gzipped, pickled file on disk for -shipping out to the servers. The server processes just check the modification -time of the file occasionally and reload their in-memory copies of the ring +shipping out to the servers. The server processes just check the modification +time of the file occasionally and reload their in-memory copies of the ring structure as needed. Because of how the ring-builder manages changes to the ring, using a slightly older ring usually just means one of the three replicas for a subset of the partitions will be incorrect, which can be easily worked around. 
@@ -48,15 +48,23 @@ partitions will end up assigned to different devices, and therefore nearly all data stored will have to be replicated to new locations. So, recovery from a builder file loss is possible, but data will definitely be unreachable for an extended time. +.PP +If invoked as 'swift-ring-builder-safe' the directory containing the builder +file provided will be locked (via a .lock file in the files parent directory). +This provides a basic safe guard against multiple instances of the swift-ring-builder +(or other utilities that observe this lock) from attempting to write to or read +the builder/ring files while operations are in progress. This can be useful in +environments where ring management has been automated but the operator still +needs to interact with the rings manually. .SH SEARCH -.PD 0 +.PD 0 .IP "\fB\fR" .RS 5 .IP "Can be of the form:" -.IP "dz-:/_" +.IP "drz-:/_" .IP "Any part is optional, but you must include at least one, examples:" @@ -65,6 +73,7 @@ extended time. .IP "z1 Matches devices in zone 1" .IP "z1-1.2.3.4 Matches devices in zone 1 with the ip 1.2.3.4" .IP "1.2.3.4 Matches devices in any zone with the ip 1.2.3.4" +.IP "r1z1:5678 Matches devices in zone 1 present in region 1 using port 5678" .IP "z1:5678 Matches devices in zone 1 using port 5678" .IP ":5678 Matches devices that use port 5678" .IP "/sdb1 Matches devices with the device name sdb1" @@ -73,12 +82,12 @@ extended time. .IP "[::1] Matches devices in any zone with the ip ::1" .IP "z1-[::1]:5678 Matches devices in zone 1 with ip ::1 and port 5678" .RE - + Most specific example: .RS 3 -d74z1-1.2.3.4:5678/sdb1_"snet: 5.6.7.8" -.RE +d74z1-1.2.3.4:5678/sdb1_"snet: 5.6.7.8" +.RE Nerd explanation: @@ -86,17 +95,22 @@ Nerd explanation: .IP "All items require their single character prefix except the ip, in which case the - is optional unless the device id or zone is also included." .RE .RE -.PD +.PD + +.SH OPTIONS +.TP +.I "\-y, \-\-yes" +Assume a yes response to all questions .SH COMMANDS -.PD 0 +.PD 0 .IP "\fB\fR" .RS 5 -Shows information about the ring and the devices within. +Shows information about the ring and the devices within. .RE @@ -106,17 +120,19 @@ Shows information about matching devices. .RE -.IP "\fBadd\fR z-:/_" +.IP "\fBadd\fR z-:/_ " +.IP "\fBadd\fR rz-:/_ " +.IP "\fBadd\fR -r -z -i -p -d -m -w " .RS 5 -Adds a device to the ring with the given information. No partitions will be -assigned to the new device until after running 'rebalance'. This is so you +Adds a device to the ring with the given information. No partitions will be +assigned to the new device until after running 'rebalance'. This is so you can make multiple device changes and rebalance them all just once. .RE .IP "\fBcreate\fR " .RS 5 -Creates with 2^ partitions and . +Creates with 2^ partitions and . is number of hours to restrict moving a partition more than once. .RE @@ -128,11 +144,11 @@ the devices matching the search values given. The first column is the assigned partition number and the second column is the number of device matches for that partition. The list is ordered from most number of matches to least. If there are a lot of devices to match against, this command -could take a while to run. +could take a while to run. .RE -.IP "\fBrebalence\fR" +.IP "\fBrebalance\fR" .RS 5 Attempts to rebalance the ring by reassigning partitions that haven't been recently reassigned. 
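Putting the create, add and rebalance commands together, a minimal sketch of building a three-replica ring (the builder name, device address, port and weight are illustrative, not taken from this patch):

    swift-ring-builder object.builder create 10 3 1
    swift-ring-builder object.builder add r1z1-10.0.0.1:6200/sdb1 100
    swift-ring-builder object.builder rebalance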
.RE @@ -140,37 +156,37 @@ Attempts to rebalance the ring by reassigning partitions that haven't been recen .IP "\fBremove\fR " .RS 5 -Removes the device(s) from the ring. This should normally just be used for -a device that has failed. For a device you wish to decommission, it's best -to set its weight to 0, wait for it to drain all its data, then use this -remove command. This will not take effect until after running 'rebalance'. +Removes the device(s) from the ring. This should normally just be used for +a device that has failed. For a device you wish to decommission, it's best +to set its weight to 0, wait for it to drain all its data, then use this +remove command. This will not take effect until after running 'rebalance'. This is so you can make multiple device changes and rebalance them all just once. .RE .IP "\fBset_info\fR :/_" .RS 5 -Resets the device's information. This information isn't used to assign -partitions, so you can use 'write_ring' afterward to rewrite the current -ring with the newer device information. Any of the parts are optional -in the final :/_ parameter; just give what you -want to change. For instance set_info d74 _"snet: 5.6.7.8" would just +Resets the device's information. This information isn't used to assign +partitions, so you can use 'write_ring' afterward to rewrite the current +ring with the newer device information. Any of the parts are optional +in the final :/_ parameter; just give what you +want to change. For instance set_info d74 _"snet: 5.6.7.8" would just update the meta data for device id 74. .RE .IP "\fBset_min_part_hours\fR " .RS 5 -Changes the to the given . This should be set to -however long a full replication/update cycle takes. We're working on a way +Changes the to the given . This should be set to +however long a full replication/update cycle takes. We're working on a way to determine this more easily than scanning logs. .RE .IP "\fBset_weight\fR " .RS 5 -Resets the device's weight. No partitions will be reassigned to or from the -device until after running 'rebalance'. This is so you can make multiple +Resets the device's weight. No partitions will be reassigned to or from the +device until after running 'rebalance'. This is so you can make multiple device changes and rebalance them all just once. .RE @@ -183,8 +199,8 @@ Just runs the validation routines on the ring. .IP "\fBwrite_ring\fR" .RS 5 -Just rewrites the distributable ring file. This is done automatically after -a successful rebalance, so really this is only useful after one or more 'set_info' +Just rewrites the distributable ring file. This is done automatically after +a successful rebalance, so really this is only useful after one or more 'set_info' calls when no rebalance is needed but you want to send out the new device information. 
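Following the set_info example given in the text above, one might push out updated device metadata without a rebalance (the builder file name is assumed):

    swift-ring-builder object.builder set_info d74 _"snet: 5.6.7.8"
    swift-ring-builder object.builder write_ring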
.RE @@ -193,17 +209,16 @@ calls when no rebalance is needed but you want to send out the new device inform set_min_part_hours set_weight validate write_ring \fBExit codes:\fR 0 = ring changed, 1 = ring did not change, 2 = error -.PD +.PD - -.SH DOCUMENTATION -.LP -More in depth documentation about the swift ring and also Openstack-Swift as a -whole can be found at -.BI http://swift.openstack.org/overview_ring.html, -.BI http://swift.openstack.org/admin_guide.html#managing-the-rings -and -.BI http://swift.openstack.org +.SH DOCUMENTATION +.LP +More in depth documentation about the swift ring and also OpenStack Swift as a +whole can be found at +.BI https://docs.openstack.org/swift/latest/overview_ring.html +.BI https://docs.openstack.org/swift/latest/admin_guide.html#managing-the-rings +and +.BI https://docs.openstack.org/swift/latest/ diff --git a/doc/manpages/swift-ring-composer.1 b/doc/manpages/swift-ring-composer.1 new file mode 100644 index 0000000000..8d029ff334 --- /dev/null +++ b/doc/manpages/swift-ring-composer.1 @@ -0,0 +1,40 @@ +.TH swift-ring-composer "1" "June 2018" "Linux" "OpenStack Swift" +.SH NAME +.B swift-ring-composer +\- manual page for swift-ring-composer + +.SH SYNOPSIS +.LP +.B swift-ring-composer +[\-h] {show,compose} ... + +.SH DESCRIPTION +This is a tool for building a composite ring file from other existing ring +builder files. The component ring builders must all have the same partition +power. Each device must only be used in a single component builder. Each +region must only be used in a single component builder. +.PP +.B NOTE: +This tool is for experimental use and may be removed in future versions of Swift. +.PP +.SS "positional arguments:" +.TP + +Name of composite builder file +.SS "optional arguments:" +.TP +\fB\-h\fR, \fB\-\-help\fR +show this help message and exit +.SH "COMMANDS" +.TP +.SS "\fBshow\fR [-h]" +show composite ring builder metadata +.TP +.SS "\fBcompose\fR [-h] [ [ ...] --output [--force]" +compose composite ring +.PP +.SH DOCUMENTATION +.LP +More in depth documentation about the swift ring and also OpenStack Swift as a +whole can be found at +.BI https://swift.openstack.org diff --git a/doc/manpages/swift.1 b/doc/manpages/swift.1 deleted file mode 100644 index 9e86dd1601..0000000000 --- a/doc/manpages/swift.1 +++ /dev/null @@ -1,121 +0,0 @@ -.\" -.\" Author: Joao Marcelo Martins or -.\" Copyright (c) 2010-2011 OpenStack, LLC. -.\" -.\" Licensed under the Apache License, Version 2.0 (the "License"); -.\" you may not use this file except in compliance with the License. -.\" You may obtain a copy of the License at -.\" -.\" http://www.apache.org/licenses/LICENSE-2.0 -.\" -.\" Unless required by applicable law or agreed to in writing, software -.\" distributed under the License is distributed on an "AS IS" BASIS, -.\" WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or -.\" implied. -.\" See the License for the specific language governing permissions and -.\" limitations under the License. -.\" -.TH swift 1 "8/26/2011" "Linux" "OpenStack Swift" - -.SH NAME -.LP -.B swift -\- Openstack-swift swift tool - -.SH SYNOPSIS -.LP -.B swift -[options] [args] - -.SH DESCRIPTION -.PP -The swift tool is a command line interface script for communicating with -an openstack-swift object storage environment. It allows one to perform -several types of operations. - -.SH COMMANDS -.PP - -\fBstat\fR [\fIcontainer\fR] [\fIobject\fR] -.RS 4 -Displays information for the account, container, or object depending on the args given (if any). 
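Referring back to the swift-ring-composer compose usage above, a hypothetical composition of two component builders might look like (all file names are made up for illustration):

    swift-ring-composer composite.builder compose region1.builder region2.builder --output object.ring.gz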
-.RE - -\fBlist\fR [\fIcommand-options\fR] [\fIcontainer\fR] -.RS 4 -Lists the containers for the account or the objects for a container. The -p or --prefix is an option that will only list items beginning -with that prefix. The -d or --delimiter is option (for container listings only) -that will roll up items with the given delimiter (see Cloud Files general -documentation for what this means). -.RE - -\fBupload\fR [\fIcommand-options\fR] container file_or_directory [\fIfile_or_directory\fR] [...] -.RS 4 -Uploads to the given container the files and directories specified by the -remaining args. The -c or --changed is an option that will only upload files -that have changed since the last upload. The -S or --segment-size -and --leave-segments are options as well (see --help for more). -.RE - -\fBpost\fR [\fIcommand-options\fR] [\fIcontainer\fR] [\fIobject\fR] -.RS 4 -Updates meta information for the account, container, or object depending -on the args given. If the container is not found, it will be created -automatically; but this is not true for accounts and objects. Containers -also allow the -r (or --read-acl) and -w (or --write-acl) options. The -m -or --meta option is allowed on all and used to define the user meta data -items to set in the form Name:Value. This option can be repeated. -\fBExample\fR: post -m Color:Blue -m Size:Large -.RE - - \fBdownload\fR [\fIcommand-options\fR] [\fIcontainer\fR] [\fIobject\fR] [\fIobject\fR] [...] -.RS 4 -Downloads everything in the account (with --all), or everything in a -container, or a list of objects depending on the args given. For a single -object download, you may use the -o [--output] option to -redirect the output to a specific file or if "-" then just redirect to stdout. -.RE - -\fBdelete\fR [\fIcommand-options\fR] [\fIcontainer\fR] [\fIobject\fR] [\fIobject\fR] [...] -.RS 4 -Deletes everything in the account (with --all), or everything in a container, -or a list of objects depending on the args given. Segments of manifest objects -will be deleted as well, unless you specify the --leave-segments option. -.RE - - .SH OPTIONS -.PD 0 -.IP "--version Show program's version number and exit" -.IP "-h, --help Show this help message and exit" -.IP "-s, --snet Use SERVICENET internal network" -.IP "-v, --verbose Print more info" -.IP "-q, --quiet Suppress status output" -.IP "-A AUTH, --auth=AUTH URL for obtaining an auth token " -.IP "-U USER, --user=USER User name for obtaining an auth token" -.IP "-K KEY, --key=KEY Key for obtaining an auth token" -.PD - - .SH EXAMPLE -.PP -swift -A https://127.0.0.1:443/auth/v1.0 -U swiftops:swiftops -K swiftops stat - -.RS 2 -.PD 0 -.IP "Account: AUTH_43b42dae-dc0b-4a4b-ac55-97de614d6e6e" -.IP "Containers: 1" -.IP "Objects: 1" -.IP "Bytes: 1124" -.IP "Accept-Ranges: bytes" -.IP "X-Trans-Id: txb21186a9eef64ed295a1e95896a0fc72" -.PD -.RE - - -.SH DOCUMENTATION -.LP -More in depth documentation about Openstack-Swift as a whole can be found at -.BI http://swift.openstack.org - - -.LP - diff --git a/doc/manpages/swift.conf.5 b/doc/manpages/swift.conf.5 new file mode 100644 index 0000000000..b750cfdd4f --- /dev/null +++ b/doc/manpages/swift.conf.5 @@ -0,0 +1,217 @@ +.\" +.\" Author: Nandini Tata +.\" Copyright (c) 2016 OpenStack Foundation. +.\" +.\" Licensed under the Apache License, Version 2.0 (the "License"); +.\" you may not use this file except in compliance with the License. 
+.\" You may obtain a copy of the License at +.\" +.\" http://www.apache.org/licenses/LICENSE-2.0 +.\" +.\" Unless required by applicable law or agreed to in writing, software +.\" distributed under the License is distributed on an "AS IS" BASIS, +.\" WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +.\" implied. +.\" See the License for the specific language governing permissions and +.\" limitations under the License. +.\" +.TH swift.conf 5 "8/8/2016" "Linux" "OpenStack Swift" + +.SH NAME +.LP +.B swift.conf +\- common configuration file for the OpenStack object storage services + + + +.SH SYNOPSIS +.LP +.B swift.conf + + + +.SH DESCRIPTION +.PP +This is the common configuration file used by all services of OpenStack object +storage services. + +The configuration file follows the python-pastedeploy syntax. The file is +divided into sections, which are enclosed by square brackets. Each section +will contain a certain number of key/value parameters which are described +later. + +Any line that begins with a '#' symbol is ignored. + +You can find more information about python-pastedeploy configuration format at +\fIhttps://docs.pylonsproject.org/projects/pastedeploy/en/latest/#config-format\fR + + + +.SH SWIFT HASH SECTION +.PD 1 +.RS 0 +This is indicated by section named [swift-hash]. Below are the parameters that +are acceptable within this section: + +.PD 0 +.IP "\fBswift_hash_path_suffix\fR" +.IP "\fBswift_hash_path_prefix\fR" +.PD + +swift_hash_path_suffix and swift_hash_path_prefix are used as part of the +hashing algorithm when determining data placement in the cluster. +These values should remain secret and MUST NOT change once a cluster has been +deployed. + +Use only printable chars (python -c "import string; print(string.printable)"). + + + +.SH STORAGE POLICY SECTION +.PD 1 +.RS 0 +This is indicated by section name [storage-policy:#] + +Storage policies are defined here and they determine various characteristics +about how objects are stored and treated. Policies are specified by name on +a per container basis. The policy index is specified in the section header +and is used internally. The policy with index 0 is always used for legacy +containers and can be given a name for use in metadata; however, the ring file +name will always be 'object.ring.gz' for backwards compatibility. If no +policies are defined, a policy with index 0 will be automatically created for +backwards compatibility and given the name Policy-0. A default policy is used +when creating new containers when no policy is specified in the request. If +no other policies are defined, the policy with index 0 will be declared the +default. If multiple policies are defined, you must define a policy with index +0 and you must specify a default. It is recommended you always define a +section for storage-policy:0. Aliases are not mandatory when defining a +storage policy. + +.IP "\fB[storage-policy:index]\fR" +Each storage policy is defined in a separate section with an index specified +in the header. Below are the parameters that are acceptable within this +section: + +.IP "\fBname\fR" +Name of the storage policy. Policy names are case insensitive. +.IP "\fBaliases\fR" +Multiple names can be assigned to one policy using aliases. All names must +follow the Swift naming rules. +.IP "\fBpolicy_type\fR" +Policy type can be replication or erasure_coding. Replication policy +replicates the objects to specified number of replicas. Erasure coding uses +PyECLib API library for encode/decode operations. 
Please refer to Swift +documentation for details on how erasure coding is implemented. +.IP "\fBec_type\fR" +This parameter must be chosen from the list of EC backends supported by +PyECLib. +.IP "\fBec_num_data_fragments\fR" +This parameter is specific to 'erasure coding' policy_type only. It defines +the number of fragments that will be comprised of data. +.IP "\fBec_num_parity_fragments\fR" +This parameter is specific to 'erasure coding' policy_type only. It defines +the number of fragments that will be comprised of parity. +.IP "\fBec_object_segment_size\fR" +This parameter is specific to 'erasure coding' policy_type only. It defines +the amount of data that will be buffered up before feeding a segment into the +encoder/decoder. The default value is 1048576. +.IP "\fIExamples:\fR" + +.PD 0 +.IP "[storage-policy:0]" +.IP "name = Policy-0" +.IP "default = yes" +.IP "policy_type = replication" +.IP "aliases = yellow, orange" + +.IP "[storage-policy:1]" +.IP "name = silver" +.IP "policy_type = replication" + +.IP "[storage-policy:2]" +.IP "name = deepfreeze10-4" +.IP "aliases = df10-4" +.IP "policy_type = erasure_coding" +.IP "ec_type = liberasurecode_rs_vand" +.IP "ec_num_data_fragments = 10" +.IP "ec_num_parity_fragments = 4" +.IP "ec_object_segment_size = 1048576" +.PD +.RE +.PD + + + +.SH SWIFT CONSTRAINTS SECTION +.PD 1 +.RS 0 +This is indicated by section name [swift-constraints]. This section sets the +basic constraints on data saved in the swift cluster. These constraints are +automatically published by the proxy server in responses to /info requests. +Below are the parameters that are acceptable within this section: +.IP "\fBmax_file_size\fR" +max_file_size is the largest "normal" object that can be saved in the cluster. +This is also the limit on the size of each segment of a "large" object when +using the large object manifest support. This value is set in bytes. Setting +it to lower than 1MiB will cause some tests to fail. It is STRONGLY +recommended to leave this value at the default (5 * 2**30 + 2). +.IP "\fBmax_meta_name_length\fR" +max_meta_name_length is the max number of bytes in the utf8 encoding of the +name portion of a metadata header. +.IP "\fBmax_meta_value_length\fR" +max_meta_value_length is the max number of bytes in the utf8 encoding of a +metadata value. +.IP "\fBmax_meta_count\fR" +max_meta_count is the max number of metadata keys that can be stored on a +single account, container, or object. +.IP "\fBmax_meta_overall_size\fR" +max_meta_overall_size is the max number of bytes in the utf8 encoding of the +metadata (keys + values). +.IP "\fBmax_header_size\fR" +max_header_size is the max number of bytes in the utf8 encoding of each +header. Using 8192 as default because eventlet uses 8192 as max size of header +line. This value may need to be increased when using identity v3 API tokens +including more than 7 catalog entries. +.IP "\fBextra_header_count\fR" +By default the maximum number of allowed headers depends on the number of max +allowed metadata settings plus a default value of 36 for swift internally +generated headers and regular http headers. If for some reason this is not +enough (custom middleware for example) it can be increased with the +extra_header_count constraint. +.IP "\fBmax_object_name_length\fR" +max_object_name_length is the max number of bytes in the utf8 encoding of an +object name. +.IP "\fBcontainer_listing_limit\fR" +container_listing_limit is the default (and max) number of items returned for +a container listing request. 
+.IP "\fBaccount_listing_limit\fR" +account_listing_limit is the default (and max) number of items returned for an +account listing request. +.IP "\fBmax_account_name_length\fR" +max_account_name_length is the max number of bytes in the utf8 encoding of an +account name. +.IP "\fBmax_container_name_length\fR" +max_container_name_length is the max number of bytes in the utf8 encoding of a +container name. +.IP "\fBvalid_api_versions\fR" +By default, all REST API calls should use "v1" or "v1.0" as the version string, +for example "/v1/account". This can be manually overridden to make this +backward-compatible, in case a different version string has been used before. +Use a comma-separated list in case of multiple allowed versions, for example +valid_api_versions = v0,v1,v2. +This is only enforced for account, container and object requests. The allowed +api versions are by default excluded from /info. +.IP "\fBauto_create_account_prefix\fR" +auto_create_account_prefix specifies the prefix for system accounts, such as +those used by the object-expirer, and container-sharder. +Default is ".". + + + +.SH DOCUMENTATION +.LP +More in depth documentation about the swift.conf and also OpenStack-Swift as a +whole can be found at +.BI https://docs.openstack.org/swift/latest/admin_guide.html +and +.BI https://docs.openstack.org/swift/latest/ diff --git a/doc/requirements.txt b/doc/requirements.txt new file mode 100644 index 0000000000..32c5aaebd6 --- /dev/null +++ b/doc/requirements.txt @@ -0,0 +1,10 @@ +# The order of packages is significant, because pip processes them in the order +# of appearance. Changing the order has an impact on the overall integration +# process, which may cause wedges in the gate later. +# this is required for the docs build jobs +sphinx>=2.0.0,!=2.1.0 # BSD +openstackdocstheme>=2.2.1 # Apache-2.0 +reno>=3.1.0 # Apache-2.0 +os-api-ref>=1.0.0 # Apache-2.0 +python-keystoneclient>=3.19.0 # Apache-2.0 +sphinxcontrib-svg2pdfconverter>=0.1.0 # BSD diff --git a/doc/s3api/conf/ceph-known-failures-keystone.yaml b/doc/s3api/conf/ceph-known-failures-keystone.yaml new file mode 100644 index 0000000000..69f0e76ffb --- /dev/null +++ b/doc/s3api/conf/ceph-known-failures-keystone.yaml @@ -0,0 +1,194 @@ +ceph_s3: + :teardown: {status: KNOWN} + :setup: {status: KNOWN} + s3tests.functional.test_headers.test_bucket_create_bad_authorization_invalid_aws2: {status: KNOWN} + s3tests.functional.test_headers.test_bucket_create_bad_authorization_none: {status: KNOWN} + s3tests.functional.test_headers.test_object_create_bad_authorization_invalid_aws2: {status: KNOWN} + s3tests.functional.test_headers.test_object_create_bad_authorization_none: {status: KNOWN} + s3tests.functional.test_s3.test_100_continue: {status: KNOWN} + s3tests.functional.test_s3.test_atomic_conditional_write_1mb: {status: KNOWN} + s3tests.functional.test_s3.test_atomic_dual_conditional_write_1mb: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_acl_default: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_acl_grant_email: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_acl_grant_email_notexist: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_acl_grant_nonexist_user: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_acl_grant_userid_fullcontrol: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_acl_grant_userid_read: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_acl_grant_userid_readacp: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_acl_grant_userid_write: {status: 
KNOWN} + s3tests.functional.test_s3.test_bucket_acl_grant_userid_writeacp: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_acl_no_grants: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_acls_changes_persistent: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_acl_xml_fullcontrol: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_acl_xml_read: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_acl_xml_readacp: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_acl_xml_write: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_acl_xml_writeacp: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_header_acl_grants: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_list_objects_anonymous: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_list_objects_anonymous_fail: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_recreate_not_overriding: {status: KNOWN} + s3tests.functional.test_s3.test_cors_origin_response: {status: KNOWN} + s3tests.functional.test_s3.test_cors_origin_wildcard: {status: KNOWN} + s3tests.functional.test_s3.test_list_buckets_anonymous: {status: KNOWN} + s3tests.functional.test_s3.test_list_buckets_invalid_auth: {status: KNOWN} + s3tests.functional.test_s3.test_logging_toggle: {status: KNOWN} + s3tests.functional.test_s3.test_multipart_resend_first_finishes_last: {status: KNOWN} + s3tests.functional.test_s3.test_object_acl_full_control_verify_owner: {status: KNOWN} + s3tests.functional.test_s3.test_object_acl_xml: {status: KNOWN} + s3tests.functional.test_s3.test_object_acl_xml_read: {status: KNOWN} + s3tests.functional.test_s3.test_object_acl_xml_readacp: {status: KNOWN} + s3tests.functional.test_s3.test_object_acl_xml_write: {status: KNOWN} + s3tests.functional.test_s3.test_object_acl_xml_writeacp: {status: KNOWN} + s3tests.functional.test_s3.test_object_copy_canned_acl: {status: KNOWN} + s3tests.functional.test_s3.test_object_copy_not_owned_object_bucket: {status: KNOWN} + s3tests.functional.test_s3.test_object_giveaway: {status: KNOWN} + s3tests.functional.test_s3.test_object_header_acl_grants: {status: KNOWN} + s3tests.functional.test_s3.test_object_raw_get: {status: KNOWN} + s3tests.functional.test_s3.test_object_raw_get_bucket_acl: {status: KNOWN} + s3tests.functional.test_s3.test_object_raw_get_bucket_gone: {status: KNOWN} + s3tests.functional.test_s3.test_object_raw_get_object_acl: {status: KNOWN} + s3tests.functional.test_s3.test_object_raw_get_object_gone: {status: KNOWN} + s3tests.functional.test_s3.test_object_raw_put: {status: KNOWN} + s3tests.functional.test_s3.test_object_raw_put_write_access: {status: KNOWN} + s3tests.functional.test_s3.test_object_set_valid_acl: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_anonymous_request: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_authenticated_request: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_authenticated_request_bad_access_key: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_case_insensitive_condition_fields: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_condition_is_case_sensitive: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_escaped_field_values: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_expired_policy: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_expires_is_case_sensitive: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_ignored_header: {status: KNOWN} + 
s3tests.functional.test_s3.test_post_object_invalid_access_key: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_invalid_content_length_argument: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_invalid_date_format: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_invalid_request_field_value: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_invalid_signature: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_missing_conditions_list: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_missing_content_length_argument: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_missing_expires_condition: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_missing_policy_condition: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_missing_signature: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_no_key_specified: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_request_missing_policy_specified_field: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_set_invalid_success_code: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_set_key_from_filename: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_set_success_code: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_success_redirect_action: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_upload_larger_than_chunk: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_upload_size_below_minimum: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_upload_size_limit_exceeded: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_user_specified_header: {status: KNOWN} + s3tests.functional.test_s3.test_put_object_ifmatch_failed: {status: KNOWN} + s3tests.functional.test_s3.test_put_object_ifmatch_good: {status: KNOWN} + s3tests.functional.test_s3.test_put_object_ifmatch_nonexisted_failed: {status: KNOWN} + s3tests.functional.test_s3.test_put_object_ifmatch_overwrite_existed_good: {status: KNOWN} + s3tests.functional.test_s3.test_put_object_ifnonmatch_failed: {status: KNOWN} + s3tests.functional.test_s3.test_put_object_ifnonmatch_good: {status: KNOWN} + s3tests.functional.test_s3.test_set_cors: {status: KNOWN} + s3tests.functional.test_s3.test_stress_bucket_acls_changes: {status: KNOWN} + s3tests.functional.test_s3.test_versioned_concurrent_object_create_concurrent_remove: {status: KNOWN} + s3tests.functional.test_s3.test_versioned_object_acl: {status: KNOWN} + s3tests.functional.test_s3.test_versioning_copy_obj_version: {status: KNOWN} + s3tests.functional.test_s3.test_versioning_multi_object_delete: {status: KNOWN} + s3tests.functional.test_s3.test_versioning_multi_object_delete_with_marker: {status: KNOWN} + s3tests.functional.test_s3.test_versioning_multi_object_delete_with_marker_create: {status: KNOWN} + s3tests.functional.test_s3.test_versioning_obj_create_overwrite_multipart: {status: KNOWN} + s3tests.functional.test_s3.test_versioning_obj_create_read_remove_head: {status: KNOWN} + s3tests.functional.test_s3.test_versioning_obj_create_versions_remove_all: {status: KNOWN} + s3tests.functional.test_s3.test_versioning_obj_create_versions_remove_special_names: {status: KNOWN} + s3tests.functional.test_s3.test_versioning_obj_suspend_versions: {status: KNOWN} + s3tests.functional.test_s3.test_versioning_obj_suspend_versions_simple: {status: KNOWN} + s3tests.functional.test_s3_website.check_can_test_website: {status: KNOWN} + 
s3tests.functional.test_s3_website.test_website_bucket_private_redirectall_base: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_bucket_private_redirectall_path: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_bucket_private_redirectall_path_upgrade: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_nonexistant_bucket_rgw: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_nonexistant_bucket_s3: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_private_bucket_list_empty: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_private_bucket_list_empty_blockederrordoc: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_private_bucket_list_empty_gooderrordoc: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_private_bucket_list_empty_missingerrordoc: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_private_bucket_list_private_index: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_private_bucket_list_private_index_blockederrordoc: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_private_bucket_list_private_index_gooderrordoc: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_private_bucket_list_private_index_missingerrordoc: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_private_bucket_list_public_index: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_public_bucket_list_empty: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_public_bucket_list_empty_blockederrordoc: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_public_bucket_list_empty_gooderrordoc: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_public_bucket_list_empty_missingerrordoc: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_public_bucket_list_private_index: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_public_bucket_list_private_index_blockederrordoc: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_public_bucket_list_private_index_gooderrordoc: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_public_bucket_list_private_index_missingerrordoc: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_public_bucket_list_public_index: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_xredirect_nonwebsite: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_xredirect_private_abs: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_xredirect_private_relative: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_xredirect_public_abs: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_xredirect_public_relative: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_list_return_data_versioning: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_policy: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_policy_acl: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_policy_another_bucket: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_policy_different_tenant: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_policy_set_condition_operator_end_with_IfExists: {status: KNOWN} + s3tests.functional.test_s3.test_delete_tags_obj_public: {status: KNOWN} + s3tests.functional.test_s3.test_encryption_sse_c_invalid_md5: {status: KNOWN} + 
s3tests.functional.test_s3.test_encryption_sse_c_method_head: {status: KNOWN} + s3tests.functional.test_s3.test_encryption_sse_c_multipart_bad_download: {status: KNOWN} + s3tests.functional.test_s3.test_encryption_sse_c_multipart_invalid_chunks_1: {status: KNOWN} + s3tests.functional.test_s3.test_encryption_sse_c_multipart_invalid_chunks_2: {status: KNOWN} + s3tests.functional.test_s3.test_encryption_sse_c_no_key: {status: KNOWN} + s3tests.functional.test_s3.test_encryption_sse_c_no_md5: {status: KNOWN} + s3tests.functional.test_s3.test_encryption_sse_c_other_key: {status: KNOWN} + s3tests.functional.test_s3.test_encryption_sse_c_post_object_authenticated_request: {status: KNOWN} + s3tests.functional.test_s3.test_encryption_sse_c_present: {status: KNOWN} + s3tests.functional.test_s3.test_get_obj_head_tagging: {status: KNOWN} + s3tests.functional.test_s3.test_get_obj_tagging: {status: KNOWN} + s3tests.functional.test_s3.test_get_tags_acl_public: {status: KNOWN} + s3tests.functional.test_s3.test_lifecycle_deletemarker_expiration: {status: KNOWN} + s3tests.functional.test_s3.test_lifecycle_expiration: {status: KNOWN} + s3tests.functional.test_s3.test_lifecycle_expiration_date: {status: KNOWN} + s3tests.functional.test_s3.test_lifecycle_get: {status: KNOWN} + s3tests.functional.test_s3.test_lifecycle_get_no_id: {status: KNOWN} + s3tests.functional.test_s3.test_lifecycle_id_too_long: {status: KNOWN} + s3tests.functional.test_s3.test_lifecycle_multipart_expiration: {status: KNOWN} + s3tests.functional.test_s3.test_lifecycle_noncur_expiration: {status: KNOWN} + s3tests.functional.test_s3.test_lifecycle_rules_conflicted: {status: KNOWN} + s3tests.functional.test_s3.test_lifecycle_same_id: {status: KNOWN} + s3tests.functional.test_s3.test_lifecycle_set: {status: KNOWN} + s3tests.functional.test_s3.test_lifecycle_set_date: {status: KNOWN} + s3tests.functional.test_s3.test_lifecycle_set_deletemarker: {status: KNOWN} + s3tests.functional.test_s3.test_lifecycle_set_empty_filter: {status: KNOWN} + s3tests.functional.test_s3.test_lifecycle_set_filter: {status: KNOWN} + s3tests.functional.test_s3.test_lifecycle_set_multipart: {status: KNOWN} + s3tests.functional.test_s3.test_lifecycle_set_noncurrent: {status: KNOWN} + s3tests.functional.test_s3.test_multipart_copy_invalid_range: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_empty_conditions: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_tags_anonymous_request: {status: KNOWN} + s3tests.functional.test_s3.test_post_object_tags_authenticated_request: {status: KNOWN} + s3tests.functional.test_s3.test_put_delete_tags: {status: KNOWN} + s3tests.functional.test_s3.test_put_excess_key_tags: {status: KNOWN} + s3tests.functional.test_s3.test_put_excess_tags: {status: KNOWN} + s3tests.functional.test_s3.test_put_excess_val_tags: {status: KNOWN} + s3tests.functional.test_s3.test_put_max_kvsize_tags: {status: KNOWN} + s3tests.functional.test_s3.test_put_max_tags: {status: KNOWN} + s3tests.functional.test_s3.test_put_modify_tags: {status: KNOWN} + s3tests.functional.test_s3.test_put_obj_with_tags: {status: KNOWN} + s3tests.functional.test_s3.test_put_tags_acl_public: {status: KNOWN} + s3tests.functional.test_s3.test_sse_kms_method_head: {status: KNOWN} + s3tests.functional.test_s3.test_sse_kms_multipart_invalid_chunks_1: {status: KNOWN} + s3tests.functional.test_s3.test_sse_kms_multipart_invalid_chunks_2: {status: KNOWN} + s3tests.functional.test_s3.test_sse_kms_multipart_upload: {status: KNOWN} + 
s3tests.functional.test_s3.test_sse_kms_post_object_authenticated_request: {status: KNOWN} + s3tests.functional.test_s3.test_sse_kms_present: {status: KNOWN} + s3tests.functional.test_s3.test_sse_kms_read_declare: {status: KNOWN} + s3tests.functional.test_s3.test_sse_kms_transfer_13b: {status: KNOWN} + s3tests.functional.test_s3.test_sse_kms_transfer_1MB: {status: KNOWN} + s3tests.functional.test_s3.test_sse_kms_transfer_1b: {status: KNOWN} + s3tests.functional.test_s3.test_sse_kms_transfer_1kb: {status: KNOWN} + s3tests.functional.test_s3.test_versioned_object_acl_no_version_specified: {status: KNOWN} diff --git a/doc/s3api/conf/ceph-known-failures-tempauth.yaml b/doc/s3api/conf/ceph-known-failures-tempauth.yaml new file mode 100644 index 0000000000..86dc1dbdb5 --- /dev/null +++ b/doc/s3api/conf/ceph-known-failures-tempauth.yaml @@ -0,0 +1,359 @@ +ceph_s3: + :teardown: {status: KNOWN} + :teardown: {status: KNOWN} + :setup: {status: KNOWN} + s3tests.functional.test_headers.test_bucket_create_bad_authorization_invalid_aws2: {status: KNOWN} + s3tests.functional.test_headers.test_bucket_create_bad_authorization_none: {status: KNOWN} + s3tests.functional.test_headers.test_object_create_bad_authorization_invalid_aws2: {status: KNOWN} + s3tests.functional.test_headers.test_object_create_bad_authorization_none: {status: KNOWN} + s3tests.functional.test_s3.test_atomic_dual_conditional_write_1mb: {status: KNOWN} + s3tests.functional.test_s3.test_logging_toggle: {status: KNOWN} + s3tests.functional.test_s3_website.check_can_test_website: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_bucket_private_redirectall_base: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_bucket_private_redirectall_path: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_bucket_private_redirectall_path_upgrade: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_nonexistant_bucket_rgw: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_nonexistant_bucket_s3: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_private_bucket_list_empty: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_private_bucket_list_empty_blockederrordoc: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_private_bucket_list_empty_gooderrordoc: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_private_bucket_list_empty_missingerrordoc: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_private_bucket_list_private_index: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_private_bucket_list_private_index_blockederrordoc: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_private_bucket_list_private_index_gooderrordoc: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_private_bucket_list_private_index_missingerrordoc: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_private_bucket_list_public_index: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_public_bucket_list_empty: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_public_bucket_list_empty_blockederrordoc: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_public_bucket_list_empty_gooderrordoc: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_public_bucket_list_empty_missingerrordoc: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_public_bucket_list_private_index: {status: KNOWN} + 
s3tests.functional.test_s3_website.test_website_public_bucket_list_private_index_blockederrordoc: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_public_bucket_list_private_index_gooderrordoc: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_public_bucket_list_private_index_missingerrordoc: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_public_bucket_list_public_index: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_xredirect_nonwebsite: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_xredirect_private_abs: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_xredirect_private_relative: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_xredirect_public_abs: {status: KNOWN} + s3tests.functional.test_s3_website.test_website_xredirect_public_relative: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_policy_different_tenant: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_policy_set_condition_operator_end_with_IfExists: {status: KNOWN} + s3tests.functional.test_s3.test_encryption_sse_c_multipart_invalid_chunks_1: {status: KNOWN} + s3tests.functional.test_s3.test_encryption_sse_c_multipart_invalid_chunks_2: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_policy_put_obj_enc: {status: KNOWN} + s3tests.functional.test_s3.test_bucket_policy_put_obj_request_obj_tag: {status: KNOWN} + s3tests.functional.test_s3.test_append_object_position_wrong: {status: KNOWN} + s3tests.functional.test_s3.test_append_normal_object: {status: KNOWN} + s3tests.functional.test_s3.test_append_object: {status: KNOWN} + s3tests_boto3.functional.test_headers.test_bucket_create_bad_authorization_empty: {status: KNOWN} + s3tests_boto3.functional.test_headers.test_bucket_create_bad_authorization_invalid_aws2: {status: KNOWN} + s3tests_boto3.functional.test_headers.test_bucket_create_bad_authorization_none: {status: KNOWN} + s3tests_boto3.functional.test_headers.test_bucket_create_bad_date_none_aws2: {status: KNOWN} + s3tests_boto3.functional.test_headers.test_object_create_bad_authorization_empty: {status: KNOWN} + s3tests_boto3.functional.test_headers.test_object_create_bad_authorization_incorrect_aws2: {status: KNOWN} + s3tests_boto3.functional.test_headers.test_object_create_bad_authorization_invalid_aws2: {status: KNOWN} + s3tests_boto3.functional.test_headers.test_object_create_bad_authorization_none: {status: KNOWN} + s3tests_boto3.functional.test_headers.test_object_create_bad_contentlength_mismatch_above: {status: KNOWN} + s3tests_boto3.functional.test_headers.test_object_create_bad_contentlength_mismatch_below_aws2: {status: KNOWN} + s3tests_boto3.functional.test_headers.test_object_create_bad_contentlength_none: {status: KNOWN} + s3tests_boto3.functional.test_headers.test_object_create_bad_date_none_aws2: {status: KNOWN} + s3tests_boto3.functional.test_headers.test_bucket_create_bad_ua_empty_aws2: {status: KNOWN} + s3tests_boto3.functional.test_headers.test_bucket_create_bad_ua_none_aws2: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_100_continue: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_atomic_conditional_write_1mb: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_atomic_dual_conditional_write_1mb: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_acl_grant_email: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_acl_grant_email_notexist: {status: KNOWN} + 
s3tests_boto3.functional.test_s3.test_bucket_acl_grant_nonexist_user: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_acl_no_grants: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_create_exists: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_create_naming_bad_long: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_create_naming_bad_punctuation: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_create_naming_bad_short_empty: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_head_extended: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_list_objects_anonymous: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_list_objects_anonymous_fail: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_list_return_data_versioning: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_list_unordered: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_listv2_objects_anonymous: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_listv2_objects_anonymous_fail: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_listv2_unordered: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_policy: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_policy_acl: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_policy_another_bucket: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_policy_different_tenant: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_policy_get_obj_acl_existing_tag: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_policy_get_obj_existing_tag: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_policy_get_obj_tagging_existing_tag: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_policy_put_obj_acl: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_policy_put_obj_copy_source: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_policy_put_obj_copy_source_meta: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_policy_put_obj_enc: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_policy_put_obj_grant: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_policy_put_obj_request_obj_tag: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_policy_put_obj_tagging_existing_tag: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_policy_set_condition_operator_end_with_IfExists: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_recreate_not_overriding: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucketv2_policy: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucketv2_policy_acl: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucketv2_policy_another_bucket: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucketv2_policy_different_tenant: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_cors_header_option: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_cors_origin_response: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_cors_origin_wildcard: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_delete_tags_obj_public: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_encryption_key_no_sse_c: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_encryption_sse_c_invalid_md5: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_encryption_sse_c_method_head: {status: KNOWN} + 
s3tests_boto3.functional.test_s3.test_encryption_sse_c_multipart_bad_download: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_encryption_sse_c_multipart_invalid_chunks_1: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_encryption_sse_c_multipart_invalid_chunks_2: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_encryption_sse_c_no_key: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_encryption_sse_c_no_md5: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_encryption_sse_c_other_key: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_encryption_sse_c_post_object_authenticated_request: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_encryption_sse_c_present: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_get_obj_head_tagging: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_get_obj_tagging: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_get_tags_acl_public: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_lifecycle_deletemarker_expiration: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_lifecycle_expiration: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_lifecycle_expiration_date: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_lifecycle_expiration_days0: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_lifecycle_expiration_header_head: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_lifecycle_expiration_header_put: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_lifecycle_expiration_versioning_enabled: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_lifecycle_get: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_lifecycle_get_no_id: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_lifecycle_id_too_long: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_lifecycle_multipart_expiration: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_lifecycle_noncur_expiration: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_lifecycle_same_id: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_lifecycle_set: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_lifecycle_set_date: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_lifecycle_set_deletemarker: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_lifecycle_set_empty_filter: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_lifecycle_set_filter: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_lifecycle_set_multipart: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_lifecycle_set_noncurrent: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_lifecyclev2_expiration: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_list_buckets_anonymous: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_list_buckets_invalid_auth: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_logging_toggle: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_multipart_copy_invalid_range: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_multipart_resend_first_finishes_last: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_multipart_upload_empty: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_anon_put: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_anon_put_write_access: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_delete_key_bucket_gone: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_delete_object_with_legal_hold_off: {status: KNOWN} + 
s3tests_boto3.functional.test_s3.test_object_lock_delete_object_with_legal_hold_on: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_delete_object_with_retention: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_get_legal_hold_invalid_bucket: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_get_obj_lock: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_get_obj_metadata: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_get_obj_retention: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_get_obj_retention_invalid_bucket: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_put_legal_hold_invalid_bucket: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_put_legal_hold_invalid_status: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_put_obj_lock: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_put_obj_lock_invalid_bucket: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_put_obj_lock_invalid_days: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_put_obj_lock_invalid_status: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_put_obj_lock_invalid_years: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_put_obj_lock_with_days_and_years: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_put_obj_retention: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_put_obj_retention_increase_period: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_put_obj_retention_invalid_bucket: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_put_obj_retention_invalid_mode: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_put_obj_retention_override_default_retention: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_put_obj_retention_shorten_period: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_put_obj_retention_shorten_period_bypass: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_put_obj_retention_versionid: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_suspend_versioning: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_uploading_obj: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_raw_get: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_raw_get_bucket_acl: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_raw_get_bucket_gone: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_raw_get_object_acl: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_raw_get_object_gone: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_raw_get_x_amz_expires_out_max_range: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_raw_get_x_amz_expires_out_positive_range: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_raw_put_authenticated_expired: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_set_get_metadata_empty_to_unreadable_prefix: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_set_get_metadata_empty_to_unreadable_suffix: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_set_get_metadata_overwrite_to_unreadable_prefix: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_set_get_metadata_overwrite_to_unreadable_suffix: {status: KNOWN} + 
s3tests_boto3.functional.test_s3.test_object_set_get_non_utf8_metadata: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_set_get_unicode_metadata: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_anonymous_request: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_authenticated_no_content_type: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_authenticated_request: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_authenticated_request_bad_access_key: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_case_insensitive_condition_fields: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_condition_is_case_sensitive: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_empty_conditions: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_escaped_field_values: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_expired_policy: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_expires_is_case_sensitive: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_ignored_header: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_invalid_access_key: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_invalid_content_length_argument: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_invalid_date_format: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_invalid_request_field_value: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_invalid_signature: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_missing_conditions_list: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_missing_content_length_argument: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_missing_expires_condition: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_missing_policy_condition: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_missing_signature: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_no_key_specified: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_request_missing_policy_specified_field: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_set_invalid_success_code: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_set_key_from_filename: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_set_success_code: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_success_redirect_action: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_tags_anonymous_request: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_tags_authenticated_request: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_upload_larger_than_chunk: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_upload_size_below_minimum: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_upload_size_limit_exceeded: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_post_object_user_specified_header: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_put_delete_tags: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_put_excess_key_tags: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_put_excess_tags: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_put_excess_val_tags: {status: KNOWN} + 
s3tests_boto3.functional.test_s3.test_put_max_kvsize_tags: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_put_max_tags: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_put_modify_tags: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_put_obj_with_tags: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_put_object_ifmatch_failed: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_put_object_ifmatch_good: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_put_object_ifmatch_nonexisted_failed: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_put_object_ifmatch_overwrite_existed_good: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_put_object_ifnonmatch_failed: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_put_object_ifnonmatch_good: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_put_tags_acl_public: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_set_cors: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_set_tagging: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_sse_kms_method_head: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_sse_kms_multipart_invalid_chunks_1: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_sse_kms_multipart_invalid_chunks_2: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_sse_kms_multipart_upload: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_sse_kms_not_declared: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_sse_kms_post_object_authenticated_request: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_sse_kms_present: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_sse_kms_read_declare: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_sse_kms_transfer_13b: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_sse_kms_transfer_1MB: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_sse_kms_transfer_1b: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_sse_kms_transfer_1kb: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_versioning_bucket_multipart_upload_return_version_id: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_versioning_multi_object_delete_with_marker_create: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_versioning_obj_plain_null_version_overwrite: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_account_usage: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_head_bucket_usage: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_set_get_metadata_empty_to_unreadable_infix: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_recreate_overwrite_acl: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_recreate_new_acl: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_acl_grant_email_not_exist: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_buckets_list_ctime: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_create_naming_good_starts_alpha: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_bucket_create_naming_good_starts_digit: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_list_multipart_upload_owner: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_set_bucket_tagging: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_atomic_dual_write_1mb: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_atomic_dual_write_4mb: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_atomic_dual_write_8mb: {status: KNOWN} + 
s3tests_boto3.functional.test_s3.test_lifecycle_expiration_tags1: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_lifecycle_expiration_tags2: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_lifecycle_expiration_versioned_tags2: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_lifecycle_expiration_noncur_tags1: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_lifecycle_expiration_header_tags_head: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_lifecycle_expiration_header_and_tags_head: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_get_obj_retention_iso8601: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_multi_delete_object_with_retention: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_changing_mode_from_governance_without_bypass: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_lock_changing_mode_from_compliance: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_object_read_unreadable: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_user_policy: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_get_bucket_policy_status: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_get_public_acl_bucket_policy_status: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_get_authpublic_acl_bucket_policy_status: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_get_publicpolicy_acl_bucket_policy_status: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_get_nonpublicpolicy_acl_bucket_policy_status: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_get_nonpublicpolicy_deny_bucket_policy_status: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_get_default_public_block: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_put_public_block: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_block_public_put_bucket_acls: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_block_public_object_canned_acls: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_block_public_policy: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_ignore_public_acls: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_multipart_upload_on_a_bucket_with_policy: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_put_bucket_encryption: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_get_bucket_encryption: {status: KNOWN} + s3tests_boto3.functional.test_s3.test_delete_bucket_encryption: {status: KNOWN} + s3tests_boto3.functional.test_s3select.test_generate_where_clause: {status: KNOWN} + s3tests_boto3.functional.test_s3select.test_generate_projection: {status: KNOWN} + s3tests_boto3.functional.test_s3select.test_count_operation: {status: KNOWN} + s3tests_boto3.functional.test_s3select.test_column_sum_min_max: {status: KNOWN} + s3tests_boto3.functional.test_s3select.test_nullif_expressions: {status: KNOWN} + s3tests_boto3.functional.test_s3select.test_nulliftrue_expressions: {status: KNOWN} + s3tests_boto3.functional.test_s3select.test_is_not_null_expressions: {status: KNOWN} + s3tests_boto3.functional.test_s3select.test_lowerupper_expressions: {status: KNOWN} + s3tests_boto3.functional.test_s3select.test_in_expressions: {status: KNOWN} + s3tests_boto3.functional.test_s3select.test_true_false_in_expressions: {status: KNOWN} + s3tests_boto3.functional.test_s3select.test_like_expressions: {status: KNOWN} + s3tests_boto3.functional.test_s3select.test_truefalselike_expressions: {status: KNOWN} + 
s3tests_boto3.functional.test_s3select.test_complex_expressions: {status: KNOWN} + s3tests_boto3.functional.test_s3select.test_alias: {status: KNOWN} + s3tests_boto3.functional.test_s3select.test_alias_cyclic_refernce: {status: KNOWN} + s3tests_boto3.functional.test_s3select.test_datetime: {status: KNOWN} + s3tests_boto3.functional.test_s3select.test_true_false_datetime: {status: KNOWN} + s3tests_boto3.functional.test_s3select.test_csv_parser: {status: KNOWN} + s3tests_boto3.functional.test_s3select.test_csv_definition: {status: KNOWN} + s3tests_boto3.functional.test_s3select.test_schema_definition: {status: KNOWN} + s3tests_boto3.functional.test_s3select.test_when_then_else_expressions: {status: KNOWN} + s3tests_boto3.functional.test_s3select.test_coalesce_expressions: {status: KNOWN} + s3tests_boto3.functional.test_s3select.test_cast_expressions: {status: KNOWN} + s3tests_boto3.functional.test_s3select.test_trim_expressions: {status: KNOWN} + s3tests_boto3.functional.test_s3select.test_truefalse_trim_expressions: {status: KNOWN} + s3tests_boto3.functional.test_s3select.test_escape_expressions: {status: KNOWN} + s3tests_boto3.functional.test_s3select.test_case_value_expressions: {status: KNOWN} + s3tests_boto3.functional.test_s3select.test_bool_cast_expressions: {status: KNOWN} + s3tests_boto3.functional.test_s3select.test_progress_expressions: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_get_session_token: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_get_session_token_permanent_creds_denied: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_assume_role_allow: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_assume_role_deny: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_assume_role_creds_expiry: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_assume_role_deny_head_nonexistent: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_assume_role_allow_head_nonexistent: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_assume_role_with_web_identity: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_session_policy_check_on_different_buckets: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_session_policy_check_on_same_bucket: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_session_policy_check_put_obj_denial: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_swapping_role_policy_and_session_policy: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_session_policy_check_different_op_permissions: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_session_policy_check_with_deny_effect: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_session_policy_check_with_deny_on_same_op: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_session_policy_bucket_policy_role_arn: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_session_policy_bucket_policy_session_arn: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_session_policy_copy_object: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_session_policy_no_bucket_role_policy: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_session_policy_bucket_policy_deny: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_assume_role_with_web_identity_with_sub: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_assume_role_with_web_identity_with_azp: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_assume_role_with_web_identity_with_request_tag: {status: KNOWN} + 
s3tests_boto3.functional.test_sts.test_assume_role_with_web_identity_with_principal_tag: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_assume_role_with_web_identity_for_all_values: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_assume_role_with_web_identity_for_all_values_deny: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_assume_role_with_web_identity_tag_keys_trust_policy: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_assume_role_with_web_identity_tag_keys_role_policy: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_assume_role_with_web_identity_resource_tag: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_assume_role_with_web_identity_resource_tag_deny: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_assume_role_with_web_identity_wrong_resource_tag_deny: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_assume_role_with_web_identity_resource_tag_princ_tag: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_assume_role_with_web_identity_resource_tag_copy_obj: {status: KNOWN} + s3tests_boto3.functional.test_sts.test_assume_role_with_web_identity_role_resource_tag: {status: KNOWN} diff --git a/doc/s3api/rnc/access_control_policy.rnc b/doc/s3api/rnc/access_control_policy.rnc new file mode 100644 index 0000000000..c857359e09 --- /dev/null +++ b/doc/s3api/rnc/access_control_policy.rnc @@ -0,0 +1,7 @@ +include "common.rnc" + +start = + element AccessControlPolicy { + element Owner { CanonicalUser } & + element AccessControlList { AccessControlList } + } diff --git a/doc/s3api/rnc/bucket_logging_status.rnc b/doc/s3api/rnc/bucket_logging_status.rnc new file mode 100644 index 0000000000..a7d9a1effc --- /dev/null +++ b/doc/s3api/rnc/bucket_logging_status.rnc @@ -0,0 +1,10 @@ +include "common.rnc" + +start = + element BucketLoggingStatus { + element LoggingEnabled { + element TargetBucket { xsd:string } & + element TargetPrefix { xsd:string } & + element TargetGrants { AccessControlList }? + }? + } diff --git a/doc/s3api/rnc/common.rnc b/doc/s3api/rnc/common.rnc new file mode 100644 index 0000000000..79dddbb556 --- /dev/null +++ b/doc/s3api/rnc/common.rnc @@ -0,0 +1,26 @@ +namespace xsi = "http://www.w3.org/2001/XMLSchema-instance" + +CanonicalUser = + element ID { xsd:string } & + element DisplayName { xsd:string }? + +StorageClass = "STANDARD" | "REDUCED_REDUNDANCY" | "GLACIER" | "UNKNOWN" + +AccessControlList = + element Grant { + element Grantee { + ( + attribute xsi:type { "AmazonCustomerByEmail" }, + element EmailAddress { xsd:string } + ) | ( + attribute xsi:type { "CanonicalUser" }, + CanonicalUser + ) | ( + attribute xsi:type { "Group" }, + element URI { xsd:string } + ) + } & + element Permission { + "READ" | "WRITE" | "READ_ACP" | "WRITE_ACP" | "FULL_CONTROL" + } + }* diff --git a/doc/s3api/rnc/complete_multipart_upload.rnc b/doc/s3api/rnc/complete_multipart_upload.rnc new file mode 100644 index 0000000000..2a8459ef62 --- /dev/null +++ b/doc/s3api/rnc/complete_multipart_upload.rnc @@ -0,0 +1,12 @@ +start = + element CompleteMultipartUpload { + element Part { + element PartNumber { xsd:int } & + element ETag { xsd:string } & + element ChecksumCRC32 { xsd:string }? & + element ChecksumCRC32C { xsd:string }? & + element ChecksumCRC64NVME { xsd:string }? & + element ChecksumSHA1 { xsd:string }? & + element ChecksumSHA256 { xsd:string }? 
+ }+ + } diff --git a/doc/s3api/rnc/complete_multipart_upload_result.rnc b/doc/s3api/rnc/complete_multipart_upload_result.rnc new file mode 100644 index 0000000000..6dd9cbeb9f --- /dev/null +++ b/doc/s3api/rnc/complete_multipart_upload_result.rnc @@ -0,0 +1,7 @@ +start = + element CompleteMultipartUploadResult { + element Location { xsd:anyURI }, + element Bucket { xsd:string }, + element Key { xsd:string }, + element ETag { xsd:string } + } diff --git a/doc/s3api/rnc/copy_object_result.rnc b/doc/s3api/rnc/copy_object_result.rnc new file mode 100644 index 0000000000..bf96a8a91d --- /dev/null +++ b/doc/s3api/rnc/copy_object_result.rnc @@ -0,0 +1,5 @@ +start = + element CopyObjectResult { + element LastModified { xsd:dateTime }, + element ETag { xsd:string } + } diff --git a/doc/s3api/rnc/copy_part_result.rnc b/doc/s3api/rnc/copy_part_result.rnc new file mode 100644 index 0000000000..a7d7956515 --- /dev/null +++ b/doc/s3api/rnc/copy_part_result.rnc @@ -0,0 +1,5 @@ +start = + element CopyPartResult { + element LastModified { xsd:dateTime }, + element ETag { xsd:string } + } diff --git a/doc/s3api/rnc/create_bucket_configuration.rnc b/doc/s3api/rnc/create_bucket_configuration.rnc new file mode 100644 index 0000000000..e366d72ed5 --- /dev/null +++ b/doc/s3api/rnc/create_bucket_configuration.rnc @@ -0,0 +1,4 @@ +start = + element * { + element LocationConstraint { xsd:string } + } diff --git a/doc/s3api/rnc/delete.rnc b/doc/s3api/rnc/delete.rnc new file mode 100644 index 0000000000..a0cac2d74f --- /dev/null +++ b/doc/s3api/rnc/delete.rnc @@ -0,0 +1,8 @@ +start = + element Delete { + element Quiet { xsd:string }? & + element Object { + element Key { xsd:string } & + element VersionId { xsd:string }? + }+ + } diff --git a/doc/s3api/rnc/delete_result.rnc b/doc/s3api/rnc/delete_result.rnc new file mode 100644 index 0000000000..3a63bf78a8 --- /dev/null +++ b/doc/s3api/rnc/delete_result.rnc @@ -0,0 +1,17 @@ +start = + element DeleteResult { + ( + element Deleted { + element Key { xsd:string }, + element VersionId { xsd:string }?, + element DeleteMarker { xsd:boolean }?, + element DeleteMarkerVersionId { xsd:string }? + } | + element Error { + element Key { xsd:string }, + element VersionId { xsd:string }?, + element Code { xsd:string }, + element Message { xsd:string } + } + )* + } diff --git a/doc/s3api/rnc/error.rnc b/doc/s3api/rnc/error.rnc new file mode 100644 index 0000000000..0e352c71a6 --- /dev/null +++ b/doc/s3api/rnc/error.rnc @@ -0,0 +1,11 @@ +start = + element Error { + element Code { xsd:string }, + element Message { xsd:string }, + DebugInfo* + } + +DebugInfo = + element * { + (attribute * { text } | text | DebugInfo)* + } diff --git a/doc/s3api/rnc/initiate_multipart_upload_result.rnc b/doc/s3api/rnc/initiate_multipart_upload_result.rnc new file mode 100644 index 0000000000..8830121f95 --- /dev/null +++ b/doc/s3api/rnc/initiate_multipart_upload_result.rnc @@ -0,0 +1,6 @@ +start = + element InitiateMultipartUploadResult { + element Bucket { xsd:string }, + element Key { xsd:string }, + element UploadId { xsd:string } + } diff --git a/doc/s3api/rnc/lifecycle_configuration.rnc b/doc/s3api/rnc/lifecycle_configuration.rnc new file mode 100644 index 0000000000..b21fc07b67 --- /dev/null +++ b/doc/s3api/rnc/lifecycle_configuration.rnc @@ -0,0 +1,20 @@ +include "common.rnc" + +start = + element LifecycleConfiguration { + element Rule { + element ID { xsd:string }? & + element Prefix { xsd:string } & + element Status { "Enabled" | "Disabled" } & + element Transition { Transition }? 
& + element Expiration { Expiration }? + }+ + } + +Expiration = + element Days { xsd:int } | + element Date { xsd:dateTime } + +Transition = + Expiration & + element StorageClass { StorageClass } diff --git a/doc/s3api/rnc/list_all_my_buckets_result.rnc b/doc/s3api/rnc/list_all_my_buckets_result.rnc new file mode 100644 index 0000000000..220a34aa99 --- /dev/null +++ b/doc/s3api/rnc/list_all_my_buckets_result.rnc @@ -0,0 +1,12 @@ +include "common.rnc" + +start = + element ListAllMyBucketsResult { + element Owner { CanonicalUser }, + element Buckets { + element Bucket { + element Name { xsd:string }, + element CreationDate { xsd:dateTime } + }* + } + } diff --git a/doc/s3api/rnc/list_bucket_result.rnc b/doc/s3api/rnc/list_bucket_result.rnc new file mode 100644 index 0000000000..eb86c08042 --- /dev/null +++ b/doc/s3api/rnc/list_bucket_result.rnc @@ -0,0 +1,33 @@ +include "common.rnc" + +start = + element ListBucketResult { + element Name { xsd:string }, + element Prefix { xsd:string }, + ( + ( + element Marker { xsd:string }, + element NextMarker { xsd:string }? + ) | ( + element NextContinuationToken { xsd:string }?, + element ContinuationToken { xsd:string }?, + element StartAfter { xsd:string }?, + element KeyCount { xsd:int } + ) + ), + element MaxKeys { xsd:int }, + element Delimiter { xsd:string }?, + element EncodingType { xsd:string }?, + element IsTruncated { xsd:boolean }, + element Contents { + element Key { xsd:string }, + element LastModified { xsd:dateTime }, + element ETag { xsd:string }, + element Size { xsd:long }, + element Owner { CanonicalUser }?, + element StorageClass { StorageClass } + }*, + element CommonPrefixes { + element Prefix { xsd:string } + }* + } diff --git a/doc/s3api/rnc/list_multipart_uploads_result.rnc b/doc/s3api/rnc/list_multipart_uploads_result.rnc new file mode 100644 index 0000000000..6ac1e1237c --- /dev/null +++ b/doc/s3api/rnc/list_multipart_uploads_result.rnc @@ -0,0 +1,26 @@ +include "common.rnc" + +start = + element ListMultipartUploadsResult { + element Bucket { xsd:string }, + element KeyMarker { xsd:string }, + element UploadIdMarker { xsd:string }, + element NextKeyMarker { xsd:string }, + element NextUploadIdMarker { xsd:string }, + element Delimiter { xsd:string }?, + element Prefix { xsd:string }?, + element MaxUploads { xsd:int }, + element EncodingType { xsd:string }?, + element IsTruncated { xsd:boolean }, + element Upload { + element Key { xsd:string }, + element UploadId { xsd:string }, + element Initiator { CanonicalUser }, + element Owner { CanonicalUser }, + element StorageClass { StorageClass }, + element Initiated { xsd:dateTime } + }*, + element CommonPrefixes { + element Prefix { xsd:string } + }* + } diff --git a/doc/s3api/rnc/list_parts_result.rnc b/doc/s3api/rnc/list_parts_result.rnc new file mode 100644 index 0000000000..2143315427 --- /dev/null +++ b/doc/s3api/rnc/list_parts_result.rnc @@ -0,0 +1,22 @@ +include "common.rnc" + +start = + element ListPartsResult { + element Bucket { xsd:string }, + element Key { xsd:string }, + element UploadId { xsd:string }, + element Initiator { CanonicalUser }, + element Owner { CanonicalUser }, + element StorageClass { StorageClass }, + element PartNumberMarker { xsd:int }, + element NextPartNumberMarker { xsd:int }, + element MaxParts { xsd:int }, + element EncodingType { xsd:string }?, + element IsTruncated { xsd:boolean }, + element Part { + element PartNumber { xsd:int }, + element LastModified { xsd:dateTime }, + element ETag { xsd:string }, + element Size { xsd:long } + }* + } 
diff --git a/doc/s3api/rnc/list_versions_result.rnc b/doc/s3api/rnc/list_versions_result.rnc new file mode 100644 index 0000000000..969073f3b0 --- /dev/null +++ b/doc/s3api/rnc/list_versions_result.rnc @@ -0,0 +1,37 @@ +include "common.rnc" + +start = + element ListVersionsResult { + element Name { xsd:string }, + element Prefix { xsd:string }, + element KeyMarker { xsd:string }, + element VersionIdMarker { xsd:string }, + element NextKeyMarker { xsd:string }?, + element NextVersionIdMarker { xsd:string }?, + element MaxKeys { xsd:int }, + element EncodingType { xsd:string }?, + element Delimiter { xsd:string }?, + element IsTruncated { xsd:boolean }, + ( + element Version { + element Key { xsd:string }, + element VersionId { xsd:string }, + element IsLatest { xsd:boolean }, + element LastModified { xsd:dateTime }, + element ETag { xsd:string }, + element Size { xsd:long }, + element Owner { CanonicalUser }?, + element StorageClass { StorageClass } + } | + element DeleteMarker { + element Key { xsd:string }, + element VersionId { xsd:string }, + element IsLatest { xsd:boolean }, + element LastModified { xsd:dateTime }, + element Owner { CanonicalUser }? + } + )*, + element CommonPrefixes { + element Prefix { xsd:string } + }* + } diff --git a/doc/s3api/rnc/location_constraint.rnc b/doc/s3api/rnc/location_constraint.rnc new file mode 100644 index 0000000000..829176ff95 --- /dev/null +++ b/doc/s3api/rnc/location_constraint.rnc @@ -0,0 +1 @@ +start = element LocationConstraint { xsd:string } diff --git a/doc/s3api/rnc/versioning_configuration.rnc b/doc/s3api/rnc/versioning_configuration.rnc new file mode 100644 index 0000000000..87e5d15a97 --- /dev/null +++ b/doc/s3api/rnc/versioning_configuration.rnc @@ -0,0 +1,5 @@ +start = + element VersioningConfiguration { + element Status { "Enabled" | "Suspended" }? & + element MfaDelete { "Enabled" | "Disabled" }? 
+ } diff --git a/doc/saio/bin/remakerings b/doc/saio/bin/remakerings new file mode 100755 index 0000000000..0d67b6b4ce --- /dev/null +++ b/doc/saio/bin/remakerings @@ -0,0 +1,42 @@ +#!/bin/bash + +set -e + +cd /etc/swift + +rm -f *.builder *.ring.gz backups/*.builder backups/*.ring.gz + +swift-ring-builder object.builder create 10 3 1 +swift-ring-builder object.builder add r1z1-127.0.0.1:6210/sdb1 1 +swift-ring-builder object.builder add r1z2-127.0.0.2:6220/sdb2 1 +swift-ring-builder object.builder add r1z3-127.0.0.3:6230/sdb3 1 +swift-ring-builder object.builder add r1z4-127.0.0.4:6240/sdb4 1 +swift-ring-builder object.builder rebalance +swift-ring-builder object-1.builder create 10 2 1 +swift-ring-builder object-1.builder add r1z1-127.0.0.1:6210/sdb1 1 +swift-ring-builder object-1.builder add r1z2-127.0.0.2:6220/sdb2 1 +swift-ring-builder object-1.builder add r1z3-127.0.0.3:6230/sdb3 1 +swift-ring-builder object-1.builder add r1z4-127.0.0.4:6240/sdb4 1 +swift-ring-builder object-1.builder rebalance +swift-ring-builder object-2.builder create 10 6 1 +swift-ring-builder object-2.builder add r1z1-127.0.0.1:6210/sdb1 1 +swift-ring-builder object-2.builder add r1z1-127.0.0.1:6210/sdb5 1 +swift-ring-builder object-2.builder add r1z2-127.0.0.2:6220/sdb2 1 +swift-ring-builder object-2.builder add r1z2-127.0.0.2:6220/sdb6 1 +swift-ring-builder object-2.builder add r1z3-127.0.0.3:6230/sdb3 1 +swift-ring-builder object-2.builder add r1z3-127.0.0.3:6230/sdb7 1 +swift-ring-builder object-2.builder add r1z4-127.0.0.4:6240/sdb4 1 +swift-ring-builder object-2.builder add r1z4-127.0.0.4:6240/sdb8 1 +swift-ring-builder object-2.builder rebalance +swift-ring-builder container.builder create 10 3 1 +swift-ring-builder container.builder add r1z1-127.0.0.1:6211/sdb1 1 +swift-ring-builder container.builder add r1z2-127.0.0.2:6221/sdb2 1 +swift-ring-builder container.builder add r1z3-127.0.0.3:6231/sdb3 1 +swift-ring-builder container.builder add r1z4-127.0.0.4:6241/sdb4 1 +swift-ring-builder container.builder rebalance +swift-ring-builder account.builder create 10 3 1 +swift-ring-builder account.builder add r1z1-127.0.0.1:6212/sdb1 1 +swift-ring-builder account.builder add r1z2-127.0.0.2:6222/sdb2 1 +swift-ring-builder account.builder add r1z3-127.0.0.3:6232/sdb3 1 +swift-ring-builder account.builder add r1z4-127.0.0.4:6242/sdb4 1 +swift-ring-builder account.builder rebalance diff --git a/doc/saio/bin/resetswift b/doc/saio/bin/resetswift new file mode 100755 index 0000000000..65c7a306cd --- /dev/null +++ b/doc/saio/bin/resetswift @@ -0,0 +1,30 @@ +#!/bin/bash + +set -e + +swift-init all kill +swift-orphans -a 0 -k KILL + +# Remove the following line if you did not set up rsyslog for individual logging: +sudo find /var/log/swift -type f -exec rm -f {} \; +if cut -d' ' -f2 /proc/mounts | grep -q /mnt/sdb1 ; then + sudo umount /mnt/sdb1 +fi +# If you are using a loopback device set SAIO_BLOCK_DEVICE to "/srv/swift-disk" +sudo mkfs.xfs -f ${SAIO_BLOCK_DEVICE:-/dev/sdb1} +sudo mount /mnt/sdb1 +sudo mkdir /mnt/sdb1/1 /mnt/sdb1/2 /mnt/sdb1/3 /mnt/sdb1/4 +sudo chown ${USER}:${USER} /mnt/sdb1/* +mkdir -p /srv/1/node/sdb1 /srv/1/node/sdb5 \ + /srv/2/node/sdb2 /srv/2/node/sdb6 \ + /srv/3/node/sdb3 /srv/3/node/sdb7 \ + /srv/4/node/sdb4 /srv/4/node/sdb8 +sudo rm -f /var/log/debug /var/log/messages /var/log/rsyncd.log /var/log/syslog +find /var/cache/swift* -type f -name *.recon -exec rm -f {} \; +if [ "`type -t systemctl`" == "file" ]; then + sudo systemctl restart rsyslog + sudo systemctl restart memcached +else + sudo 
service rsyslog restart + sudo service memcached restart +fi diff --git a/doc/saio/bin/startmain b/doc/saio/bin/startmain new file mode 100755 index 0000000000..f099424db2 --- /dev/null +++ b/doc/saio/bin/startmain @@ -0,0 +1,5 @@ +#!/bin/bash + +set -e + +swift-init main start diff --git a/doc/saio/bin/startrest b/doc/saio/bin/startrest new file mode 100755 index 0000000000..bb1996b25b --- /dev/null +++ b/doc/saio/bin/startrest @@ -0,0 +1,5 @@ +#!/bin/bash + +set -e + +swift-init rest start diff --git a/doc/saio/rsyncd.conf b/doc/saio/rsyncd.conf new file mode 100644 index 0000000000..28aca5a595 --- /dev/null +++ b/doc/saio/rsyncd.conf @@ -0,0 +1,77 @@ +uid = +gid = +log file = /var/log/rsyncd.log +pid file = /var/run/rsyncd.pid +address = 0.0.0.0 + +[account6212] +max connections = 25 +path = /srv/1/node/ +read only = false +lock file = /var/lock/account6212.lock + +[account6222] +max connections = 25 +path = /srv/2/node/ +read only = false +lock file = /var/lock/account6222.lock + +[account6232] +max connections = 25 +path = /srv/3/node/ +read only = false +lock file = /var/lock/account6232.lock + +[account6242] +max connections = 25 +path = /srv/4/node/ +read only = false +lock file = /var/lock/account6242.lock + +[container6211] +max connections = 25 +path = /srv/1/node/ +read only = false +lock file = /var/lock/container6211.lock + +[container6221] +max connections = 25 +path = /srv/2/node/ +read only = false +lock file = /var/lock/container6221.lock + +[container6231] +max connections = 25 +path = /srv/3/node/ +read only = false +lock file = /var/lock/container6231.lock + +[container6241] +max connections = 25 +path = /srv/4/node/ +read only = false +lock file = /var/lock/container6241.lock + +[object6210] +max connections = 25 +path = /srv/1/node/ +read only = false +lock file = /var/lock/object6210.lock + +[object6220] +max connections = 25 +path = /srv/2/node/ +read only = false +lock file = /var/lock/object6220.lock + +[object6230] +max connections = 25 +path = /srv/3/node/ +read only = false +lock file = /var/lock/object6230.lock + +[object6240] +max connections = 25 +path = /srv/4/node/ +read only = false +lock file = /var/lock/object6240.lock diff --git a/doc/saio/rsyslog.d/10-swift.conf b/doc/saio/rsyslog.d/10-swift.conf new file mode 100644 index 0000000000..e0a5624340 --- /dev/null +++ b/doc/saio/rsyslog.d/10-swift.conf @@ -0,0 +1,30 @@ +# Uncomment the following to have a log containing all logs together +#local1,local2,local3,local4,local5.* /var/log/swift/all.log + +# Uncomment the following to have hourly proxy logs for stats processing +#$template HourlyProxyLog,"/var/log/swift/hourly/%$YEAR%%$MONTH%%$DAY%%$HOUR%" +#local1.*;local1.!notice ?HourlyProxyLog + +local1.*;local1.!notice /var/log/swift/proxy.log +local1.notice /var/log/swift/proxy.error +local1.* ~ + +local2.*;local2.!notice /var/log/swift/storage1.log +local2.notice /var/log/swift/storage1.error +local2.* ~ + +local3.*;local3.!notice /var/log/swift/storage2.log +local3.notice /var/log/swift/storage2.error +local3.* ~ + +local4.*;local4.!notice /var/log/swift/storage3.log +local4.notice /var/log/swift/storage3.error +local4.* ~ + +local5.*;local5.!notice /var/log/swift/storage4.log +local5.notice /var/log/swift/storage4.error +local5.* ~ + +local6.*;local6.!notice /var/log/swift/expirer.log +local6.notice /var/log/swift/expirer.error +local6.* ~ diff --git a/doc/saio/swift/account-server/1.conf b/doc/saio/swift/account-server/1.conf new file mode 100644 index 0000000000..e405f2de41 --- /dev/null +++ 
b/doc/saio/swift/account-server/1.conf @@ -0,0 +1,30 @@ +[DEFAULT] +devices = /srv/1/node +mount_check = false +disable_fallocate = true +bind_ip = 127.0.0.1 +bind_port = 6212 +workers = 1 +user = +log_facility = LOG_LOCAL2 +recon_cache_path = /var/cache/swift +eventlet_debug = true + +[pipeline:main] +pipeline = healthcheck recon account-server + +[app:account-server] +use = egg:swift#account + +[filter:recon] +use = egg:swift#recon + +[filter:healthcheck] +use = egg:swift#healthcheck + +[account-replicator] +rsync_module = {replication_ip}::account{replication_port} + +[account-auditor] + +[account-reaper] diff --git a/doc/saio/swift/account-server/2.conf b/doc/saio/swift/account-server/2.conf new file mode 100644 index 0000000000..9b580566ea --- /dev/null +++ b/doc/saio/swift/account-server/2.conf @@ -0,0 +1,30 @@ +[DEFAULT] +devices = /srv/2/node +mount_check = false +disable_fallocate = true +bind_ip = 127.0.0.2 +bind_port = 6222 +workers = 1 +user = +log_facility = LOG_LOCAL3 +recon_cache_path = /var/cache/swift2 +eventlet_debug = true + +[pipeline:main] +pipeline = healthcheck recon account-server + +[app:account-server] +use = egg:swift#account + +[filter:recon] +use = egg:swift#recon + +[filter:healthcheck] +use = egg:swift#healthcheck + +[account-replicator] +rsync_module = {replication_ip}::account{replication_port} + +[account-auditor] + +[account-reaper] diff --git a/doc/saio/swift/account-server/3.conf b/doc/saio/swift/account-server/3.conf new file mode 100644 index 0000000000..c0cbe6e33e --- /dev/null +++ b/doc/saio/swift/account-server/3.conf @@ -0,0 +1,30 @@ +[DEFAULT] +devices = /srv/3/node +mount_check = false +disable_fallocate = true +bind_ip = 127.0.0.3 +bind_port = 6232 +workers = 1 +user = +log_facility = LOG_LOCAL4 +recon_cache_path = /var/cache/swift3 +eventlet_debug = true + +[pipeline:main] +pipeline = healthcheck recon account-server + +[app:account-server] +use = egg:swift#account + +[filter:recon] +use = egg:swift#recon + +[filter:healthcheck] +use = egg:swift#healthcheck + +[account-replicator] +rsync_module = {replication_ip}::account{replication_port} + +[account-auditor] + +[account-reaper] diff --git a/doc/saio/swift/account-server/4.conf b/doc/saio/swift/account-server/4.conf new file mode 100644 index 0000000000..105d0eec16 --- /dev/null +++ b/doc/saio/swift/account-server/4.conf @@ -0,0 +1,30 @@ +[DEFAULT] +devices = /srv/4/node +mount_check = false +disable_fallocate = true +bind_ip = 127.0.0.4 +bind_port = 6242 +workers = 1 +user = +log_facility = LOG_LOCAL5 +recon_cache_path = /var/cache/swift4 +eventlet_debug = true + +[pipeline:main] +pipeline = healthcheck recon account-server + +[app:account-server] +use = egg:swift#account + +[filter:recon] +use = egg:swift#recon + +[filter:healthcheck] +use = egg:swift#healthcheck + +[account-replicator] +rsync_module = {replication_ip}::account{replication_port} + +[account-auditor] + +[account-reaper] diff --git a/doc/saio/swift/container-reconciler/1.conf b/doc/saio/swift/container-reconciler/1.conf new file mode 100644 index 0000000000..9350405e98 --- /dev/null +++ b/doc/saio/swift/container-reconciler/1.conf @@ -0,0 +1,49 @@ +[DEFAULT] +# swift_dir = /etc/swift +user = +# You can specify default log routing here if you want: +# log_name = swift +log_facility = LOG_LOCAL2 +# log_level = INFO +# log_address = /dev/log +# +# comma separated list of functions to call to setup custom log handlers. 
+# functions get passed: conf, name, log_to_console, log_route, fmt, logger, +# adapted_logger +# log_custom_handlers = +# +# If set, log_udp_host will override log_address +# log_udp_host = +# log_udp_port = 514 +# +# You can enable StatsD logging here: +# log_statsd_host = +# log_statsd_port = 8125 +# log_statsd_default_sample_rate = 1.0 +# log_statsd_sample_rate_factor = 1.0 +# log_statsd_metric_prefix = + +[container-reconciler] +# reclaim_age = 604800 +# interval = 300 +# request_tries = 3 +processes = 4 +process = 0 + +[pipeline:main] +pipeline = catch_errors proxy-logging cache proxy-server + +[app:proxy-server] +use = egg:swift#proxy +# See proxy-server.conf-sample for options + +[filter:cache] +use = egg:swift#memcache +# See proxy-server.conf-sample for options + +[filter:proxy-logging] +use = egg:swift#proxy_logging + +[filter:catch_errors] +use = egg:swift#catch_errors +# See proxy-server.conf-sample for options diff --git a/doc/saio/swift/container-reconciler/2.conf b/doc/saio/swift/container-reconciler/2.conf new file mode 100644 index 0000000000..6ffcf84d7d --- /dev/null +++ b/doc/saio/swift/container-reconciler/2.conf @@ -0,0 +1,49 @@ +[DEFAULT] +# swift_dir = /etc/swift +user = +# You can specify default log routing here if you want: +# log_name = swift +log_facility = LOG_LOCAL3 +# log_level = INFO +# log_address = /dev/log +# +# comma separated list of functions to call to setup custom log handlers. +# functions get passed: conf, name, log_to_console, log_route, fmt, logger, +# adapted_logger +# log_custom_handlers = +# +# If set, log_udp_host will override log_address +# log_udp_host = +# log_udp_port = 514 +# +# You can enable StatsD logging here: +# log_statsd_host = +# log_statsd_port = 8125 +# log_statsd_default_sample_rate = 1.0 +# log_statsd_sample_rate_factor = 1.0 +# log_statsd_metric_prefix = + +[container-reconciler] +# reclaim_age = 604800 +# interval = 300 +# request_tries = 3 +processes = 4 +process = 1 + +[pipeline:main] +pipeline = catch_errors proxy-logging cache proxy-server + +[app:proxy-server] +use = egg:swift#proxy +# See proxy-server.conf-sample for options + +[filter:cache] +use = egg:swift#memcache +# See proxy-server.conf-sample for options + +[filter:proxy-logging] +use = egg:swift#proxy_logging + +[filter:catch_errors] +use = egg:swift#catch_errors +# See proxy-server.conf-sample for options diff --git a/doc/saio/swift/container-reconciler/3.conf b/doc/saio/swift/container-reconciler/3.conf new file mode 100644 index 0000000000..843b7bb79e --- /dev/null +++ b/doc/saio/swift/container-reconciler/3.conf @@ -0,0 +1,49 @@ +[DEFAULT] +# swift_dir = /etc/swift +user = +# You can specify default log routing here if you want: +# log_name = swift +log_facility = LOG_LOCAL4 +# log_level = INFO +# log_address = /dev/log +# +# comma separated list of functions to call to setup custom log handlers. 
+# functions get passed: conf, name, log_to_console, log_route, fmt, logger, +# adapted_logger +# log_custom_handlers = +# +# If set, log_udp_host will override log_address +# log_udp_host = +# log_udp_port = 514 +# +# You can enable StatsD logging here: +# log_statsd_host = +# log_statsd_port = 8125 +# log_statsd_default_sample_rate = 1.0 +# log_statsd_sample_rate_factor = 1.0 +# log_statsd_metric_prefix = + +[container-reconciler] +# reclaim_age = 604800 +# interval = 300 +# request_tries = 3 +processes = 4 +process = 2 + +[pipeline:main] +pipeline = catch_errors proxy-logging cache proxy-server + +[app:proxy-server] +use = egg:swift#proxy +# See proxy-server.conf-sample for options + +[filter:cache] +use = egg:swift#memcache +# See proxy-server.conf-sample for options + +[filter:proxy-logging] +use = egg:swift#proxy_logging + +[filter:catch_errors] +use = egg:swift#catch_errors +# See proxy-server.conf-sample for options diff --git a/doc/saio/swift/container-reconciler/4.conf b/doc/saio/swift/container-reconciler/4.conf new file mode 100644 index 0000000000..b7d6dc9978 --- /dev/null +++ b/doc/saio/swift/container-reconciler/4.conf @@ -0,0 +1,49 @@ +[DEFAULT] +# swift_dir = /etc/swift +user = +# You can specify default log routing here if you want: +# log_name = swift +log_facility = LOG_LOCAL5 +# log_level = INFO +# log_address = /dev/log +# +# comma separated list of functions to call to setup custom log handlers. +# functions get passed: conf, name, log_to_console, log_route, fmt, logger, +# adapted_logger +# log_custom_handlers = +# +# If set, log_udp_host will override log_address +# log_udp_host = +# log_udp_port = 514 +# +# You can enable StatsD logging here: +# log_statsd_host = +# log_statsd_port = 8125 +# log_statsd_default_sample_rate = 1.0 +# log_statsd_sample_rate_factor = 1.0 +# log_statsd_metric_prefix = + +[container-reconciler] +# reclaim_age = 604800 +# interval = 300 +# request_tries = 3 +processes = 4 +process = 3 + +[pipeline:main] +pipeline = catch_errors proxy-logging cache proxy-server + +[app:proxy-server] +use = egg:swift#proxy +# See proxy-server.conf-sample for options + +[filter:cache] +use = egg:swift#memcache +# See proxy-server.conf-sample for options + +[filter:proxy-logging] +use = egg:swift#proxy_logging + +[filter:catch_errors] +use = egg:swift#catch_errors +# See proxy-server.conf-sample for options diff --git a/doc/saio/swift/container-server/1.conf b/doc/saio/swift/container-server/1.conf new file mode 100644 index 0000000000..af03ac8e3f --- /dev/null +++ b/doc/saio/swift/container-server/1.conf @@ -0,0 +1,42 @@ +[DEFAULT] +devices = /srv/1/node +mount_check = false +disable_fallocate = true +bind_ip = 127.0.0.1 +bind_port = 6211 +workers = 1 +user = +log_facility = LOG_LOCAL2 +recon_cache_path = /var/cache/swift +eventlet_debug = true + +[pipeline:main] +pipeline = healthcheck recon container-server + +[app:container-server] +use = egg:swift#container + +[filter:recon] +use = egg:swift#recon + +[filter:healthcheck] +use = egg:swift#healthcheck + +[container-replicator] +rsync_module = {replication_ip}::container{replication_port} + +[container-updater] + +[container-auditor] + +[container-sync] + +[container-sharder] +auto_shard = true +rsync_module = {replication_ip}::container{replication_port} +# This is intentionally much smaller than the default of 1,000,000 so tests +# can run in a reasonable amount of time +shard_container_threshold = 100 +# The probe tests make explicit assumptions about the batch sizes +shard_scanner_batch_size = 10 
+cleave_batch_size = 2 diff --git a/doc/saio/swift/container-server/2.conf b/doc/saio/swift/container-server/2.conf new file mode 100644 index 0000000000..fe20c6d2c4 --- /dev/null +++ b/doc/saio/swift/container-server/2.conf @@ -0,0 +1,42 @@ +[DEFAULT] +devices = /srv/2/node +mount_check = false +disable_fallocate = true +bind_ip = 127.0.0.2 +bind_port = 6221 +workers = 1 +user = +log_facility = LOG_LOCAL3 +recon_cache_path = /var/cache/swift2 +eventlet_debug = true + +[pipeline:main] +pipeline = healthcheck recon container-server + +[app:container-server] +use = egg:swift#container + +[filter:recon] +use = egg:swift#recon + +[filter:healthcheck] +use = egg:swift#healthcheck + +[container-replicator] +rsync_module = {replication_ip}::container{replication_port} + +[container-updater] + +[container-auditor] + +[container-sync] + +[container-sharder] +auto_shard = true +rsync_module = {replication_ip}::container{replication_port} +# This is intentionally much smaller than the default of 1,000,000 so tests +# can run in a reasonable amount of time +shard_container_threshold = 100 +# The probe tests make explicit assumptions about the batch sizes +shard_scanner_batch_size = 10 +cleave_batch_size = 2 diff --git a/doc/saio/swift/container-server/3.conf b/doc/saio/swift/container-server/3.conf new file mode 100644 index 0000000000..a6960ba065 --- /dev/null +++ b/doc/saio/swift/container-server/3.conf @@ -0,0 +1,42 @@ +[DEFAULT] +devices = /srv/3/node +mount_check = false +disable_fallocate = true +bind_ip = 127.0.0.3 +bind_port = 6231 +workers = 1 +user = +log_facility = LOG_LOCAL4 +recon_cache_path = /var/cache/swift3 +eventlet_debug = true + +[pipeline:main] +pipeline = healthcheck recon container-server + +[app:container-server] +use = egg:swift#container + +[filter:recon] +use = egg:swift#recon + +[filter:healthcheck] +use = egg:swift#healthcheck + +[container-replicator] +rsync_module = {replication_ip}::container{replication_port} + +[container-updater] + +[container-auditor] + +[container-sync] + +[container-sharder] +auto_shard = true +rsync_module = {replication_ip}::container{replication_port} +# This is intentionally much smaller than the default of 1,000,000 so tests +# can run in a reasonable amount of time +shard_container_threshold = 100 +# The probe tests make explicit assumptions about the batch sizes +shard_scanner_batch_size = 10 +cleave_batch_size = 2 diff --git a/doc/saio/swift/container-server/4.conf b/doc/saio/swift/container-server/4.conf new file mode 100644 index 0000000000..35c0a528f6 --- /dev/null +++ b/doc/saio/swift/container-server/4.conf @@ -0,0 +1,42 @@ +[DEFAULT] +devices = /srv/4/node +mount_check = false +disable_fallocate = true +bind_ip = 127.0.0.4 +bind_port = 6241 +workers = 1 +user = +log_facility = LOG_LOCAL5 +recon_cache_path = /var/cache/swift4 +eventlet_debug = true + +[pipeline:main] +pipeline = healthcheck recon container-server + +[app:container-server] +use = egg:swift#container + +[filter:recon] +use = egg:swift#recon + +[filter:healthcheck] +use = egg:swift#healthcheck + +[container-replicator] +rsync_module = {replication_ip}::container{replication_port} + +[container-updater] + +[container-auditor] + +[container-sync] + +[container-sharder] +auto_shard = true +rsync_module = {replication_ip}::container{replication_port} +# This is intentionally much smaller than the default of 1,000,000 so tests +# can run in a reasonable amount of time +shard_container_threshold = 100 +# The probe tests make explicit assumptions about the batch sizes 
+shard_scanner_batch_size = 10 +cleave_batch_size = 2 diff --git a/doc/saio/swift/container-sync-realms.conf b/doc/saio/swift/container-sync-realms.conf new file mode 100644 index 0000000000..503a71c4f1 --- /dev/null +++ b/doc/saio/swift/container-sync-realms.conf @@ -0,0 +1,5 @@ +[saio] +key = changeme +key2 = changeme +cluster_saio_endpoint = http://127.0.0.1:8080/v1/ + diff --git a/doc/saio/swift/internal-client.conf b/doc/saio/swift/internal-client.conf new file mode 100644 index 0000000000..052d1e7549 --- /dev/null +++ b/doc/saio/swift/internal-client.conf @@ -0,0 +1,24 @@ +[DEFAULT] + +[pipeline:main] +pipeline = catch_errors proxy-logging cache symlink proxy-server + +[app:proxy-server] +use = egg:swift#proxy +account_autocreate = true +# See proxy-server.conf-sample for options + +[filter:symlink] +use = egg:swift#symlink +# See proxy-server.conf-sample for options + +[filter:cache] +use = egg:swift#memcache +# See proxy-server.conf-sample for options + +[filter:proxy-logging] +use = egg:swift#proxy_logging + +[filter:catch_errors] +use = egg:swift#catch_errors +# See proxy-server.conf-sample for options diff --git a/doc/saio/swift/object-expirer.conf b/doc/saio/swift/object-expirer.conf new file mode 100644 index 0000000000..58c85d2843 --- /dev/null +++ b/doc/saio/swift/object-expirer.conf @@ -0,0 +1,58 @@ +[DEFAULT] +# swift_dir = /etc/swift +user = +# You can specify default log routing here if you want: +log_name = object-expirer +log_facility = LOG_LOCAL6 +log_level = INFO +#log_address = /dev/log +# +# comma separated list of functions to call to setup custom log handlers. +# functions get passed: conf, name, log_to_console, log_route, fmt, logger, +# adapted_logger +# log_custom_handlers = +# +# If set, log_udp_host will override log_address +# log_udp_host = +# log_udp_port = 514 +# +# You can enable StatsD logging here: +# log_statsd_host = +# log_statsd_port = 8125 +# log_statsd_default_sample_rate = 1.0 +# log_statsd_sample_rate_factor = 1.0 +# log_statsd_metric_prefix = + +[object-expirer] +interval = 300 +# report_interval = 300 +# concurrency is the level of concurrency to use to do the work, this value +# must be set to at least 1 +# concurrency = 1 +# processes is how many parts to divide the work into, one part per process +# that will be doing the work +# processes set 0 means that a single process will be doing all the work +# processes can also be specified on the command line and will override the +# config value +# processes = 0 +# process is which of the parts a particular process will work on +# process can also be specified on the command line and will override the config +# value +# process is "zero based", if you want to use 3 processes, you should run +# processes with process set to 0, 1, and 2 +# process = 0 + +[pipeline:main] +pipeline = catch_errors cache proxy-server + +[app:proxy-server] +use = egg:swift#proxy +# See proxy-server.conf-sample for options + +[filter:cache] +use = egg:swift#memcache +# See proxy-server.conf-sample for options + +[filter:catch_errors] +use = egg:swift#catch_errors +# See proxy-server.conf-sample for options diff --git a/doc/saio/swift/object-server/1.conf b/doc/saio/swift/object-server/1.conf new file mode 100644 index 0000000000..ecd5ff01c9 --- /dev/null +++ b/doc/saio/swift/object-server/1.conf @@ -0,0 +1,34 @@ +[DEFAULT] +devices = /srv/1/node +mount_check = false +disable_fallocate = true +bind_ip = 127.0.0.1 +bind_port = 6210 +workers = 1 +user = +log_facility = LOG_LOCAL2 +recon_cache_path = /var/cache/swift 
+eventlet_debug = true + +[pipeline:main] +pipeline = healthcheck recon object-server + +[app:object-server] +use = egg:swift#object + +[filter:recon] +use = egg:swift#recon + +[filter:healthcheck] +use = egg:swift#healthcheck + +[object-replicator] +rsync_module = {replication_ip}::object{replication_port} + +[object-reconstructor] + +[object-updater] + +[object-auditor] + +[object-relinker] diff --git a/doc/saio/swift/object-server/2.conf b/doc/saio/swift/object-server/2.conf new file mode 100644 index 0000000000..456f7d5586 --- /dev/null +++ b/doc/saio/swift/object-server/2.conf @@ -0,0 +1,34 @@ +[DEFAULT] +devices = /srv/2/node +mount_check = false +disable_fallocate = true +bind_ip = 127.0.0.2 +bind_port = 6220 +workers = 1 +user = +log_facility = LOG_LOCAL3 +recon_cache_path = /var/cache/swift2 +eventlet_debug = true + +[pipeline:main] +pipeline = healthcheck recon object-server + +[app:object-server] +use = egg:swift#object + +[filter:recon] +use = egg:swift#recon + +[filter:healthcheck] +use = egg:swift#healthcheck + +[object-replicator] +rsync_module = {replication_ip}::object{replication_port} + +[object-reconstructor] + +[object-updater] + +[object-auditor] + +[object-relinker] diff --git a/doc/saio/swift/object-server/3.conf b/doc/saio/swift/object-server/3.conf new file mode 100644 index 0000000000..9a0ebbdca0 --- /dev/null +++ b/doc/saio/swift/object-server/3.conf @@ -0,0 +1,34 @@ +[DEFAULT] +devices = /srv/3/node +mount_check = false +disable_fallocate = true +bind_ip = 127.0.0.3 +bind_port = 6230 +workers = 1 +user = +log_facility = LOG_LOCAL4 +recon_cache_path = /var/cache/swift3 +eventlet_debug = true + +[pipeline:main] +pipeline = healthcheck recon object-server + +[app:object-server] +use = egg:swift#object + +[filter:recon] +use = egg:swift#recon + +[filter:healthcheck] +use = egg:swift#healthcheck + +[object-replicator] +rsync_module = {replication_ip}::object{replication_port} + +[object-reconstructor] + +[object-updater] + +[object-auditor] + +[object-relinker] diff --git a/doc/saio/swift/object-server/4.conf b/doc/saio/swift/object-server/4.conf new file mode 100644 index 0000000000..1c0db1ff51 --- /dev/null +++ b/doc/saio/swift/object-server/4.conf @@ -0,0 +1,34 @@ +[DEFAULT] +devices = /srv/4/node +mount_check = false +disable_fallocate = true +bind_ip = 127.0.0.4 +bind_port = 6240 +workers = 1 +user = +log_facility = LOG_LOCAL5 +recon_cache_path = /var/cache/swift4 +eventlet_debug = true + +[pipeline:main] +pipeline = healthcheck recon object-server + +[app:object-server] +use = egg:swift#object + +[filter:recon] +use = egg:swift#recon + +[filter:healthcheck] +use = egg:swift#healthcheck + +[object-replicator] +rsync_module = {replication_ip}::object{replication_port} + +[object-reconstructor] + +[object-updater] + +[object-auditor] + +[object-relinker] diff --git a/doc/saio/swift/proxy-server.conf b/doc/saio/swift/proxy-server.conf new file mode 100644 index 0000000000..c43c036072 --- /dev/null +++ b/doc/saio/swift/proxy-server.conf @@ -0,0 +1,109 @@ +[DEFAULT] +bind_ip = 127.0.0.1 +bind_port = 8080 +workers = 1 +user = +log_facility = LOG_LOCAL1 +eventlet_debug = true + +[pipeline:main] +# Yes, proxy-logging appears twice. This is so that +# middleware-originated requests get logged too. 
+pipeline = catch_errors gatekeeper healthcheck proxy-logging cache etag-quoter listing_formats bulk tempurl ratelimit crossdomain container_sync tempauth staticweb copy container-quotas account-quotas slo dlo versioned_writes symlink proxy-logging proxy-server + +[filter:catch_errors] +use = egg:swift#catch_errors + +[filter:healthcheck] +use = egg:swift#healthcheck + +[filter:proxy-logging] +use = egg:swift#proxy_logging + +[filter:bulk] +use = egg:swift#bulk + +[filter:ratelimit] +use = egg:swift#ratelimit + +[filter:crossdomain] +use = egg:swift#crossdomain + +[filter:dlo] +use = egg:swift#dlo + +[filter:slo] +use = egg:swift#slo + +[filter:container_sync] +use = egg:swift#container_sync +current = //saio/saio_endpoint + +[filter:tempurl] +use = egg:swift#tempurl + +[filter:tempauth] +use = egg:swift#tempauth +user_admin_admin = admin .admin .reseller_admin +user_test_tester = testing .admin +user_test_tester2 = testing2 .admin +user_test_tester3 = testing3 +user_test2_tester2 = testing2 .admin + +[filter:staticweb] +use = egg:swift#staticweb + +[filter:account-quotas] +use = egg:swift#account_quotas + +[filter:container-quotas] +use = egg:swift#container_quotas + +[filter:cache] +use = egg:swift#memcache + +[filter:etag-quoter] +use = egg:swift#etag_quoter +enable_by_default = false + +[filter:gatekeeper] +use = egg:swift#gatekeeper + +[filter:versioned_writes] +use = egg:swift#versioned_writes +allow_versioned_writes = true +allow_object_versioning = true + +[filter:copy] +use = egg:swift#copy + +[filter:listing_formats] +use = egg:swift#listing_formats + +[filter:domain_remap] +use = egg:swift#domain_remap + +[filter:symlink] +use = egg:swift#symlink + +# To enable, add the s3api middleware to the pipeline before tempauth +[filter:s3api] +use = egg:swift#s3api +s3_acl = yes +check_bucket_owner = yes +cors_preflight_allow_origin = * + +# Example to create root secret: `openssl rand -base64 32` +[filter:keymaster] +use = egg:swift#keymaster +encryption_root_secret = changeme/changeme/changeme/changeme/change/= + +# To enable use of encryption add both middlewares to pipeline, example: +# keymaster encryption proxy-logging proxy-server +[filter:encryption] +use = egg:swift#encryption + +[app:proxy-server] +use = egg:swift#proxy +allow_account_management = true +account_autocreate = true diff --git a/doc/saio/swift/swift.conf b/doc/saio/swift/swift.conf new file mode 100644 index 0000000000..e01a0ac881 --- /dev/null +++ b/doc/saio/swift/swift.conf @@ -0,0 +1,21 @@ +[swift-hash] +# random unique strings that can never change (DO NOT LOSE) +# Use only printable chars (python -c "import string; print(string.printable)") +swift_hash_path_prefix = changeme +swift_hash_path_suffix = changeme + +[storage-policy:0] +name = gold +policy_type = replication +default = yes + +[storage-policy:1] +name = silver +policy_type = replication + +[storage-policy:2] +name = ec42 +policy_type = erasure_coding +ec_type = liberasurecode_rs_vand +ec_num_data_fragments = 4 +ec_num_parity_fragments = 2 diff --git a/doc/source/_extra/.htaccess b/doc/source/_extra/.htaccess new file mode 100644 index 0000000000..b45cdfeb54 --- /dev/null +++ b/doc/source/_extra/.htaccess @@ -0,0 +1,2 @@ +# docs redirects are defined here +redirectmatch 301 ^/swift/([^/]+)/team.html$ https://github.com/openstack/swift/blob/master/AUTHORS diff --git a/doc/source/_ga/layout.html b/doc/source/_ga/layout.html deleted file mode 100644 index 876fe009d8..0000000000 --- a/doc/source/_ga/layout.html +++ /dev/null @@ -1,17 +0,0 @@ -{% extends 
"!layout.html" %} - -{% block footer %} -{{ super() }} - - -{% endblock %} - diff --git a/doc/source/_static/basic.css b/doc/source/_static/basic.css deleted file mode 100644 index d909ce37c7..0000000000 --- a/doc/source/_static/basic.css +++ /dev/null @@ -1,416 +0,0 @@ -/** - * Sphinx stylesheet -- basic theme - * ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ - */ - -/* -- main layout ----------------------------------------------------------- */ - -div.clearer { - clear: both; -} - -/* -- relbar ---------------------------------------------------------------- */ - -div.related { - width: 100%; - font-size: 90%; -} - -div.related h3 { - display: none; -} - -div.related ul { - margin: 0; - padding: 0 0 0 10px; - list-style: none; -} - -div.related li { - display: inline; -} - -div.related li.right { - float: right; - margin-right: 5px; -} - -/* -- sidebar --------------------------------------------------------------- */ - -div.sphinxsidebarwrapper { - padding: 10px 5px 0 10px; -} - -div.sphinxsidebar { - float: left; - width: 230px; - margin-left: -100%; - font-size: 90%; -} - -div.sphinxsidebar ul { - list-style: none; -} - -div.sphinxsidebar ul ul, -div.sphinxsidebar ul.want-points { - margin-left: 20px; - list-style: square; -} - -div.sphinxsidebar ul ul { - margin-top: 0; - margin-bottom: 0; -} - -div.sphinxsidebar form { - margin-top: 10px; -} - -div.sphinxsidebar input { - border: 1px solid #98dbcc; - font-family: sans-serif; - font-size: 1em; -} - -img { - border: 0; -} - -/* -- search page ----------------------------------------------------------- */ - -ul.search { - margin: 10px 0 0 20px; - padding: 0; -} - -ul.search li { - padding: 5px 0 5px 20px; - background-image: url(file.png); - background-repeat: no-repeat; - background-position: 0 7px; -} - -ul.search li a { - font-weight: bold; -} - -ul.search li div.context { - color: #888; - margin: 2px 0 0 30px; - text-align: left; -} - -ul.keywordmatches li.goodmatch a { - font-weight: bold; -} - -/* -- index page ------------------------------------------------------------ */ - -table.contentstable { - width: 90%; -} - -table.contentstable p.biglink { - line-height: 150%; -} - -a.biglink { - font-size: 1.3em; -} - -span.linkdescr { - font-style: italic; - padding-top: 5px; - font-size: 90%; -} - -/* -- general index --------------------------------------------------------- */ - -table.indextable td { - text-align: left; - vertical-align: top; -} - -table.indextable dl, table.indextable dd { - margin-top: 0; - margin-bottom: 0; -} - -table.indextable tr.pcap { - height: 10px; -} - -table.indextable tr.cap { - margin-top: 10px; - background-color: #f2f2f2; -} - -img.toggler { - margin-right: 3px; - margin-top: 3px; - cursor: pointer; -} - -/* -- general body styles --------------------------------------------------- */ - -a.headerlink { - visibility: hidden; -} - -h1:hover > a.headerlink, -h2:hover > a.headerlink, -h3:hover > a.headerlink, -h4:hover > a.headerlink, -h5:hover > a.headerlink, -h6:hover > a.headerlink, -dt:hover > a.headerlink { - visibility: visible; -} - -div.body p.caption { - text-align: inherit; -} - -div.body td { - text-align: left; -} - -.field-list ul { - padding-left: 1em; -} - -.first { -} - -p.rubric { - margin-top: 30px; - font-weight: bold; -} - -/* -- sidebars -------------------------------------------------------------- */ - -div.sidebar { - margin: 0 0 0.5em 1em; - border: 1px solid #ddb; - padding: 7px 7px 0 7px; - background-color: #ffe; - width: 40%; - float: right; -} - -p.sidebar-title { - font-weight: bold; 
-} - -/* -- topics ---------------------------------------------------------------- */ - -div.topic { - border: 1px solid #ccc; - padding: 7px 7px 0 7px; - margin: 10px 0 10px 0; -} - -p.topic-title { - font-size: 1.1em; - font-weight: bold; - margin-top: 10px; -} - -/* -- admonitions ----------------------------------------------------------- */ - -div.admonition { - margin-top: 10px; - margin-bottom: 10px; - padding: 7px; -} - -div.admonition dt { - font-weight: bold; -} - -div.admonition dl { - margin-bottom: 0; -} - -p.admonition-title { - margin: 0px 10px 5px 0px; - font-weight: bold; -} - -div.body p.centered { - text-align: center; - margin-top: 25px; -} - -/* -- tables ---------------------------------------------------------------- */ - -table.docutils { - border: 0; - border-collapse: collapse; -} - -table.docutils td, table.docutils th { - padding: 1px 8px 1px 0; - border-top: 0; - border-left: 0; - border-right: 0; - border-bottom: 1px solid #aaa; -} - -table.field-list td, table.field-list th { - border: 0 !important; -} - -table.footnote td, table.footnote th { - border: 0 !important; -} - -th { - text-align: left; - padding-right: 5px; -} - -/* -- other body styles ----------------------------------------------------- */ - -dl { - margin-bottom: 15px; -} - -dd p { - margin-top: 0px; -} - -dd ul, dd table { - margin-bottom: 10px; -} - -dd { - margin-top: 3px; - margin-bottom: 10px; - margin-left: 30px; -} - -dt:target, .highlight { - background-color: #fbe54e; -} - -dl.glossary dt { - font-weight: bold; - font-size: 1.1em; -} - -.field-list ul { - margin: 0; - padding-left: 1em; -} - -.field-list p { - margin: 0; -} - -.refcount { - color: #060; -} - -.optional { - font-size: 1.3em; -} - -.versionmodified { - font-style: italic; -} - -.system-message { - background-color: #fda; - padding: 5px; - border: 3px solid red; -} - -.footnote:target { - background-color: #ffa -} - -.line-block { - display: block; - margin-top: 1em; - margin-bottom: 1em; -} - -.line-block .line-block { - margin-top: 0; - margin-bottom: 0; - margin-left: 1.5em; -} - -/* -- code displays --------------------------------------------------------- */ - -pre { - overflow: auto; -} - -td.linenos pre { - padding: 5px 0px; - border: 0; - background-color: transparent; - color: #aaa; -} - -table.highlighttable { - margin-left: 0.5em; -} - -table.highlighttable td { - padding: 0 0.5em 0 0.5em; -} - -tt.descname { - background-color: transparent; - font-weight: bold; - font-size: 1.2em; -} - -tt.descclassname { - background-color: transparent; -} - -tt.xref, a tt { - background-color: transparent; - font-weight: bold; -} - -h1 tt, h2 tt, h3 tt, h4 tt, h5 tt, h6 tt { - background-color: transparent; -} - -/* -- math display ---------------------------------------------------------- */ - -img.math { - vertical-align: middle; -} - -div.body div.math p { - text-align: center; -} - -span.eqno { - float: right; -} - -/* -- printout stylesheet --------------------------------------------------- */ - -@media print { - div.document, - div.documentwrapper, - div.bodywrapper { - margin: 0 !important; - width: 100%; - } - - div.sphinxsidebar, - div.related, - div.footer, - #top-link { - display: none; - } -} diff --git a/doc/source/_static/default.css b/doc/source/_static/default.css deleted file mode 100644 index c8091ecb4d..0000000000 --- a/doc/source/_static/default.css +++ /dev/null @@ -1,230 +0,0 @@ -/** - * Sphinx stylesheet -- default theme - * ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ - */ - -@import url("basic.css"); - -/* 
-- page layout ----------------------------------------------------------- */ - -body { - font-family: sans-serif; - font-size: 100%; - background-color: #11303d; - color: #000; - margin: 0; - padding: 0; -} - -div.document { - background-color: #1c4e63; -} - -div.documentwrapper { - float: left; - width: 100%; -} - -div.bodywrapper { - margin: 0 0 0 230px; -} - -div.body { - background-color: #ffffff; - color: #000000; - padding: 0 20px 30px 20px; -} - -div.footer { - color: #ffffff; - width: 100%; - padding: 9px 0 9px 0; - text-align: center; - font-size: 75%; -} - -div.footer a { - color: #ffffff; - text-decoration: underline; -} - -div.related { - background-color: #133f52; - line-height: 30px; - color: #ffffff; -} - -div.related a { - color: #ffffff; -} - -div.sphinxsidebar { -} - -div.sphinxsidebar h3 { - font-family: 'Trebuchet MS', sans-serif; - color: #ffffff; - font-size: 1.4em; - font-weight: normal; - margin: 0; - padding: 0; -} - -div.sphinxsidebar h3 a { - color: #ffffff; -} - -div.sphinxsidebar h4 { - font-family: 'Trebuchet MS', sans-serif; - color: #ffffff; - font-size: 1.3em; - font-weight: normal; - margin: 5px 0 0 0; - padding: 0; -} - -div.sphinxsidebar p { - color: #ffffff; -} - -div.sphinxsidebar p.topless { - margin: 5px 10px 10px 10px; -} - -div.sphinxsidebar ul { - margin: 10px; - padding: 0; - color: #ffffff; -} - -div.sphinxsidebar a { - color: #98dbcc; -} - -div.sphinxsidebar input { - border: 1px solid #98dbcc; - font-family: sans-serif; - font-size: 1em; -} - -/* -- body styles ----------------------------------------------------------- */ - -a { - color: #355f7c; - text-decoration: none; -} - -a:hover { - text-decoration: underline; -} - -div.body p, div.body dd, div.body li { - text-align: left; - line-height: 130%; -} - -div.body h1, -div.body h2, -div.body h3, -div.body h4, -div.body h5, -div.body h6 { - font-family: 'Trebuchet MS', sans-serif; - background-color: #f2f2f2; - font-weight: normal; - color: #20435c; - border-bottom: 1px solid #ccc; - margin: 20px -20px 10px -20px; - padding: 3px 0 3px 10px; -} - -div.body h1 { margin-top: 0; font-size: 200%; } -div.body h2 { font-size: 160%; } -div.body h3 { font-size: 140%; } -div.body h4 { font-size: 120%; } -div.body h5 { font-size: 110%; } -div.body h6 { font-size: 100%; } - -a.headerlink { - color: #c60f0f; - font-size: 0.8em; - padding: 0 4px 0 4px; - text-decoration: none; -} - -a.headerlink:hover { - background-color: #c60f0f; - color: white; -} - -div.body p, div.body dd, div.body li { - text-align: left; - line-height: 130%; -} - -div.admonition p.admonition-title + p { - display: inline; -} - -div.admonition p { - margin-bottom: 5px; -} - -div.admonition pre { - margin-bottom: 5px; -} - -div.admonition ul, div.admonition ol { - margin-bottom: 5px; -} - -div.note { - background-color: #eee; - border: 1px solid #ccc; -} - -div.seealso { - background-color: #ffc; - border: 1px solid #ff6; -} - -div.topic { - background-color: #eee; -} - -div.warning { - background-color: #ffe4e4; - border: 1px solid #f66; -} - -p.admonition-title { - display: inline; -} - -p.admonition-title:after { - content: ":"; -} - -pre { - padding: 5px; - background-color: #eeffcc; - color: #333333; - line-height: 120%; - border: 1px solid #ac9; - border-left: none; - border-right: none; -} - -tt { - background-color: #ecf0f3; - padding: 0 1px 0 1px; - font-size: 0.95em; -} - -.warning tt { - background: #efc2c2; -} - -.note tt { - background: #d6d6d6; -} diff --git a/doc/source/_static/tweaks.css 
b/doc/source/_static/tweaks.css deleted file mode 100644 index 1b6fdaa186..0000000000 --- a/doc/source/_static/tweaks.css +++ /dev/null @@ -1,212 +0,0 @@ -ul.todo_list { - list-style-type: none; - margin: 0; - padding: 0; -} - -ul.todo_list li { - display: block; - margin: 0; - padding: 7px 0; - border-top: 1px solid #eee; -} - -ul.todo_list li p { - display: inline; -} - -ul.todo_list li p.link { - font-weight: bold; -} - -ul.todo_list li p.details { - font-style: italic; -} - -ul.todo_list li { -} - -div.admonition { - border: 1px solid #8F1000; -} - -div.admonition p.admonition-title { - background-color: #8F1000; - border-bottom: 1px solid #8E8E8E; -} - -a { - color: #CF2F19; -} - -div.related ul li a { - color: #CF2F19; -} - -div.sphinxsidebar h4 { - background-color:#8E8E8E; - border:1px solid #255E6E; - color:white; - font-size:1em; - margin:1em 0 0.5em; - padding:0.1em 0 0.1em 0.5em; -} - -em { - font-style: normal; -} - -table.docutils { - font-size: 11px; -} - -a tt { - color:#CF2F19; -} - -/* ------------------------------------------ -PURE CSS SPEECH BUBBLES -by Nicolas Gallagher -- http://nicolasgallagher.com/pure-css-speech-bubbles/ - -http://nicolasgallagher.com -http://twitter.com/necolas - -Created: 02 March 2010 -Version: 1.1 (21 October 2010) - -Dual licensed under MIT and GNU GPLv2 © Nicolas Gallagher ------------------------------------------- */ -/* THE SPEECH BUBBLE -------------------------------------------------------------------------------------------------------------------------------- */ - -/* THE SPEECH BUBBLE -------------------------------------------------------------------------------------------------------------------------------- */ - -.triangle-border { - position:relative; - padding:15px; - margin:1em 0 3em; - border:5px solid #BC1518; - color:#333; - background:#fff; - - /* css3 */ - -moz-border-radius:10px; - -webkit-border-radius:10px; - border-radius:10px; -} - -/* Variant : for left positioned triangle ------------------------------------------- */ - -.triangle-border.left { - margin-left:30px; -} - -/* Variant : for right positioned triangle ------------------------------------------- */ - -.triangle-border.right { - margin-right:30px; -} - -/* THE TRIANGLE -------------------------------------------------------------------------------------------------------------------------------- */ - -.triangle-border:before { - content:""; - display:block; /* reduce the damage in FF3.0 */ - position:absolute; - bottom:-40px; /* value = - border-top-width - border-bottom-width */ - left:40px; /* controls horizontal position */ - width:0; - height:0; - border:20px solid transparent; - border-top-color:#BC1518; -} - -/* creates the smaller triangle */ -.triangle-border:after { - content:""; - display:block; /* reduce the damage in FF3.0 */ - position:absolute; - bottom:-26px; /* value = - border-top-width - border-bottom-width */ - left:47px; /* value = (:before left) + (:before border-left) - (:after border-left) */ - width:0; - height:0; - border:13px solid transparent; - border-top-color:#fff; -} - -/* Variant : top ------------------------------------------- */ - -/* creates the larger triangle */ -.triangle-border.top:before { - top:-40px; /* value = - border-top-width - border-bottom-width */ - right:40px; /* controls horizontal position */ - bottom:auto; - left:auto; - border:20px solid transparent; - border-bottom-color:#BC1518; -} - -/* creates the smaller triangle */ -.triangle-border.top:after { - top:-26px; /* value = - border-top-width - 
border-bottom-width */ - right:47px; /* value = (:before right) + (:before border-right) - (:after border-right) */ - bottom:auto; - left:auto; - border:13px solid transparent; - border-bottom-color:#fff; -} - -/* Variant : left ------------------------------------------- */ - -/* creates the larger triangle */ -.triangle-border.left:before { - top:10px; /* controls vertical position */ - left:-30px; /* value = - border-left-width - border-right-width */ - bottom:auto; - border-width:15px 30px 15px 0; - border-style:solid; - border-color:transparent #BC1518; -} - -/* creates the smaller triangle */ -.triangle-border.left:after { - top:16px; /* value = (:before top) + (:before border-top) - (:after border-top) */ - left:-21px; /* value = - border-left-width - border-right-width */ - bottom:auto; - border-width:9px 21px 9px 0; - border-style:solid; - border-color:transparent #fff; -} - -/* Variant : right ------------------------------------------- */ - -/* creates the larger triangle */ -.triangle-border.right:before { - top:10px; /* controls vertical position */ - right:-30px; /* value = - border-left-width - border-right-width */ - bottom:auto; - left:auto; - border-width:15px 0 15px 30px; - border-style:solid; - border-color:transparent #BC1518; -} - -/* creates the smaller triangle */ -.triangle-border.right:after { - top:16px; /* value = (:before top) + (:before border-top) - (:after border-top) */ - right:-21px; /* value = - border-left-width - border-right-width */ - bottom:auto; - left:auto; - border-width:9px 0 9px 21px; - border-style:solid; - border-color:transparent #fff; -} - diff --git a/doc/source/_theme/layout.html b/doc/source/_theme/layout.html deleted file mode 100644 index fae4d6764d..0000000000 --- a/doc/source/_theme/layout.html +++ /dev/null @@ -1,69 +0,0 @@ -{% extends "sphinxdoc/layout.html" %} -{% set css_files = css_files + ['_static/tweaks.css'] %} - -{%- macro sidebar() %} -{%- if not embedded %}{% if not theme_nosidebar|tobool %} -
[deleted template markup elided during extraction: the removed sidebar macro rendered the logo, the table of contents, previous/next topic links, a "This Page" source link, and a search box with a note pointing readers to docs.openstack.org and the older Swift 1.2 and 1.3 documentation]
- {%- endif %}{% endif %} -{%- endmacro %} \ No newline at end of file diff --git a/doc/source/_theme/theme.conf b/doc/source/_theme/theme.conf deleted file mode 100644 index e039fe01f9..0000000000 --- a/doc/source/_theme/theme.conf +++ /dev/null @@ -1,5 +0,0 @@ -[theme] -inherit = sphinxdoc -stylesheet = sphinxdoc.css -pygments_style = friendly - diff --git a/doc/source/account.rst b/doc/source/account.rst index 2ddb1f7d33..e7f0722d52 100644 --- a/doc/source/account.rst +++ b/doc/source/account.rst @@ -4,22 +4,22 @@ Account ******* -.. _account-server: +.. _account-auditor: -Account Server -============== +Account Auditor +=============== -.. automodule:: swift.account.server +.. automodule:: swift.account.auditor :members: :undoc-members: :show-inheritance: -.. _account-auditor: +.. _account-backend: -Account Auditor +Account Backend =============== -.. automodule:: swift.account.auditor +.. automodule:: swift.account.backend :members: :undoc-members: :show-inheritance: @@ -34,3 +34,12 @@ Account Reaper :undoc-members: :show-inheritance: +.. _account-server: + +Account Server +============== + +.. automodule:: swift.account.server + :members: + :undoc-members: + :show-inheritance: diff --git a/doc/source/admin/figures/objectstorage-accountscontainers.png b/doc/source/admin/figures/objectstorage-accountscontainers.png new file mode 100644 index 0000000000..4df7326a80 Binary files /dev/null and b/doc/source/admin/figures/objectstorage-accountscontainers.png differ diff --git a/doc/source/admin/figures/objectstorage-arch.png b/doc/source/admin/figures/objectstorage-arch.png new file mode 100644 index 0000000000..3b7978b673 Binary files /dev/null and b/doc/source/admin/figures/objectstorage-arch.png differ diff --git a/doc/source/admin/figures/objectstorage-buildingblocks.png b/doc/source/admin/figures/objectstorage-buildingblocks.png new file mode 100644 index 0000000000..8499ca1ead Binary files /dev/null and b/doc/source/admin/figures/objectstorage-buildingblocks.png differ diff --git a/doc/source/admin/figures/objectstorage-nodes.png b/doc/source/admin/figures/objectstorage-nodes.png new file mode 100644 index 0000000000..e7a0396f5f Binary files /dev/null and b/doc/source/admin/figures/objectstorage-nodes.png differ diff --git a/doc/source/admin/figures/objectstorage-partitions.png b/doc/source/admin/figures/objectstorage-partitions.png new file mode 100644 index 0000000000..7e319ca0b7 Binary files /dev/null and b/doc/source/admin/figures/objectstorage-partitions.png differ diff --git a/doc/source/admin/figures/objectstorage-replication.png b/doc/source/admin/figures/objectstorage-replication.png new file mode 100644 index 0000000000..8ce1309131 Binary files /dev/null and b/doc/source/admin/figures/objectstorage-replication.png differ diff --git a/doc/source/admin/figures/objectstorage-ring.png b/doc/source/admin/figures/objectstorage-ring.png new file mode 100644 index 0000000000..22ef31201a Binary files /dev/null and b/doc/source/admin/figures/objectstorage-ring.png differ diff --git a/doc/source/admin/figures/objectstorage-usecase.png b/doc/source/admin/figures/objectstorage-usecase.png new file mode 100644 index 0000000000..5d7c8f421e Binary files /dev/null and b/doc/source/admin/figures/objectstorage-usecase.png differ diff --git a/doc/source/admin/figures/objectstorage-zones.png b/doc/source/admin/figures/objectstorage-zones.png new file mode 100644 index 0000000000..ee5ffbf72c Binary files /dev/null and b/doc/source/admin/figures/objectstorage-zones.png differ diff --git 
a/doc/source/admin/figures/objectstorage.png b/doc/source/admin/figures/objectstorage.png new file mode 100644 index 0000000000..9454065c28 Binary files /dev/null and b/doc/source/admin/figures/objectstorage.png differ diff --git a/doc/source/admin/index.rst b/doc/source/admin/index.rst new file mode 100644 index 0000000000..1145a82570 --- /dev/null +++ b/doc/source/admin/index.rst @@ -0,0 +1,21 @@ +=================================== +OpenStack Swift Administrator Guide +=================================== + +.. toctree:: + :maxdepth: 2 + + objectstorage-intro.rst + objectstorage-features.rst + objectstorage-characteristics.rst + objectstorage-components.rst + objectstorage-ringbuilder.rst + objectstorage-arch.rst + objectstorage-replication.rst + objectstorage-large-objects.rst + objectstorage-auditors.rst + objectstorage-EC.rst + objectstorage-account-reaper.rst + objectstorage-tenant-specific-image-storage.rst + objectstorage-monitoring.rst + objectstorage-troubleshoot.rst diff --git a/doc/source/admin/objectstorage-EC.rst b/doc/source/admin/objectstorage-EC.rst new file mode 100644 index 0000000000..2e324079d0 --- /dev/null +++ b/doc/source/admin/objectstorage-EC.rst @@ -0,0 +1,19 @@ +============== +Erasure coding +============== + +Erasure coding is a set of algorithms that allows the reconstruction of +missing data from a set of original data. In theory, erasure coding uses +less capacity with similar durability characteristics as replicas. +From an application perspective, erasure coding support is transparent. +Object Storage (swift) implements erasure coding as a Storage Policy. +See :doc:`/overview_policies` for more details. + +There is no external API related to erasure coding. Create a container using a +Storage Policy; the interaction with the cluster is the same as any +other durability policy. Because support implements as a Storage Policy, +you can isolate all storage devices that associate with your cluster's +erasure coding capability. It is entirely possible to share devices between +storage policies, but for erasure coding it may make more sense to use +not only separate devices but possibly even entire nodes dedicated for erasure +coding. diff --git a/doc/source/admin/objectstorage-account-reaper.rst b/doc/source/admin/objectstorage-account-reaper.rst new file mode 100644 index 0000000000..0acdc20578 --- /dev/null +++ b/doc/source/admin/objectstorage-account-reaper.rst @@ -0,0 +1,51 @@ +============== +Account reaper +============== + +The purpose of the account reaper is to remove data from the deleted accounts. + +A reseller marks an account for deletion by issuing a ``DELETE`` request +on the account's storage URL. This action sets the ``status`` column of +the account_stat table in the account database and replicas to +``DELETED``, marking the account's data for deletion. + +Typically, a specific retention time or undelete are not provided. +However, you can set a ``delay_reaping`` value in the +``[account-reaper]`` section of the ``account-server.conf`` file to +delay the actual deletion of data. At this time, to undelete you have to update +the account database replicas directly, set the status column to an +empty string and update the put_timestamp to be greater than the +delete_timestamp. + +.. note:: + + It is on the development to-do list to write a utility that performs + this task, preferably through a REST call. + +The account reaper runs on each account server and scans the server +occasionally for account databases marked for deletion. 
It only fires up +on the accounts for which the server is the primary node, so that +multiple account servers aren't trying to do it simultaneously. Using +multiple servers to delete one account might improve the deletion speed +but requires coordination to avoid duplication. Speed really is not a +big concern with data deletion, and large accounts aren't deleted often. + +Deleting an account is simple. For each account container, all objects +are deleted and then the container is deleted. Deletion requests that +fail will not stop the overall process but will cause the overall +process to fail eventually (for example, if an object delete times out, +you will not be able to delete the container or the account). The +account reaper keeps trying to delete an account until it is empty, at +which point the database reclaim process within the db\_replicator will +remove the database files. + +A persistent error state may prevent the deletion of an object or +container. If this happens, you will see a message in the log, for example: + +.. code-block:: console + + Account has not been reaped since + +You can control when this is logged with the ``reap_warn_after`` value in the +``[account-reaper]`` section of the ``account-server.conf`` file. +The default value is 30 days. diff --git a/doc/source/admin/objectstorage-arch.rst b/doc/source/admin/objectstorage-arch.rst new file mode 100644 index 0000000000..69b7fd96a7 --- /dev/null +++ b/doc/source/admin/objectstorage-arch.rst @@ -0,0 +1,89 @@ +==================== +Cluster architecture +==================== + +Access tier +~~~~~~~~~~~ +Large-scale deployments segment off an access tier, which is considered +the Object Storage system's central hub. The access tier fields the +incoming API requests from clients and moves data in and out of the +system. This tier consists of front-end load balancers, ssl-terminators, +and authentication services. It runs the (distributed) brain of the +Object Storage system: the proxy server processes. + +.. note:: + + If you want to use OpenStack Identity API v3 for authentication, you + have the following options available in ``/etc/swift/dispersion.conf``: + ``auth_version``, ``user_domain_name``, ``project_domain_name``, + and ``project_name``. + +**Object Storage architecture** + + +.. figure:: figures/objectstorage-arch.png + + +Because access servers are collocated in their own tier, you can scale +out read/write access regardless of the storage capacity. For example, +if a cluster is on the public Internet, requires SSL termination, and +has a high demand for data access, you can provision many access +servers. However, if the cluster is on a private network and used +primarily for archival purposes, you need fewer access servers. + +Since this is an HTTP addressable storage service, you may incorporate a +load balancer into the access tier. + +Typically, the tier consists of a collection of 1U servers. These +machines use a moderate amount of RAM and are network I/O intensive. +Since these systems field each incoming API request, you should +provision them with two high-throughput (10GbE) interfaces - one for the +incoming front-end requests and the other for the back-end access to +the object storage nodes to put and fetch data. + +Factors to consider +------------------- + +For most publicly facing deployments as well as private deployments +available across a wide-reaching corporate network, you use SSL to +encrypt traffic to the client. 
SSL adds significant processing load to +establish sessions between clients, which is why you have to provision +more capacity in the access layer. SSL may not be required for private +deployments on trusted networks. + +Storage nodes +~~~~~~~~~~~~~ + +In most configurations, each of the five zones should have an equal +amount of storage capacity. Storage nodes use a reasonable amount of +memory and CPU. Metadata needs to be readily available to return objects +quickly. The object stores run services not only to field incoming +requests from the access tier, but to also run replicators, auditors, +and reapers. You can provision storage nodes with single gigabit or +10 gigabit network interface depending on the expected workload and +desired performance, although it may be desirable to isolate replication +traffic with a second interface. + +**Object Storage (swift)** + + +.. figure:: figures/objectstorage-nodes.png + + + +Currently, a 2 TB or 3 TB SATA disk delivers good performance for the +price. You can use desktop-grade drives if you have responsive remote +hands in the datacenter and enterprise-grade drives if you don't. + +Factors to consider +------------------- + +You should keep in mind the desired I/O performance for single-threaded +requests. This system does not use RAID, so a single disk handles each +request for an object. Disk performance impacts single-threaded response +rates. + +To achieve apparent higher throughput, the object storage system is +designed to handle concurrent uploads/downloads. The network I/O +capacity (1GbE, bonded 1GbE pair, or 10GbE) should match your desired +concurrent throughput needs for reads and writes. diff --git a/doc/source/admin/objectstorage-auditors.rst b/doc/source/admin/objectstorage-auditors.rst new file mode 100644 index 0000000000..1a3a5783cf --- /dev/null +++ b/doc/source/admin/objectstorage-auditors.rst @@ -0,0 +1,30 @@ +============== +Object Auditor +============== + +On system failures, the XFS file system can sometimes truncate files it is +trying to write and produce zero-byte files. The object-auditor will catch +these problems but in the case of a system crash it is advisable to run +an extra, less rate limited sweep, to check for these specific files. +You can run this command as follows: + +.. code-block:: console + + $ swift-object-auditor /path/to/object-server/config/file.conf once -z 1000 + +.. note:: + + "-z" means to only check for zero-byte files at 1000 files per second. + +It is useful to run the object auditor on a specific device or set of devices. +You can run the object-auditor once as follows: + +.. code-block:: console + + $ swift-object-auditor /path/to/object-server/config/file.conf once \ + --devices=sda,sdb + +.. note:: + + This will run the object auditor on only the ``sda`` and ``sdb`` devices. + This parameter accepts a comma-separated list of values. diff --git a/doc/source/admin/objectstorage-characteristics.rst b/doc/source/admin/objectstorage-characteristics.rst new file mode 100644 index 0000000000..3846bccb25 --- /dev/null +++ b/doc/source/admin/objectstorage-characteristics.rst @@ -0,0 +1,47 @@ +============================== +Object Storage characteristics +============================== + +The key characteristics of Object Storage are that: + +- All objects stored in Object Storage have a URL. + +- "Storage Policies" may be used to define different levels of durability + for objects stored in the cluster. These policies support not only + complete replicas but also erasure-coded fragments. 
+ +- All replicas or fragments for an object are stored in as-unique-as-possible + zones to increase durability and availability. + +- All objects have their own metadata. + +- Developers interact with the object storage system through a RESTful + HTTP API. + +- Object data can be located anywhere in the cluster. + +- The cluster scales by adding additional nodes without sacrificing + performance, which allows a more cost-effective linear storage + expansion than fork-lift upgrades. + +- Data does not have to be migrated to an entirely new storage system. + +- New nodes can be added to the cluster without downtime. + +- Failed nodes and disks can be swapped out without downtime. + +- It runs on industry-standard hardware, such as Dell, HP, and + Supermicro. + +.. _objectstorage-figure: + +Object Storage (swift) + +.. figure:: figures/objectstorage.png + +Developers can either write directly to the Swift API or use one of the +many client libraries that exist for all of the popular programming +languages, such as Java, Python, Ruby, and C#. Amazon S3 and RackSpace +Cloud Files users should be very familiar with Object Storage. Users new +to object storage systems will have to adjust to a different approach +and mindset than those required for a traditional filesystem. diff --git a/doc/source/admin/objectstorage-components.rst b/doc/source/admin/objectstorage-components.rst new file mode 100644 index 0000000000..d784e07599 --- /dev/null +++ b/doc/source/admin/objectstorage-components.rst @@ -0,0 +1,255 @@ +========== +Components +========== + +Object Storage uses the following components to deliver high +availability, high durability, and high concurrency: + +- **Proxy servers** - Handle all of the incoming API requests. + +- **Rings** - Map logical names of data to locations on particular + disks. + +- **Zones** - Isolate data from other zones. A failure in one zone + does not impact the rest of the cluster as data replicates + across zones. + +- **Accounts and containers** - Each account and container are + individual databases that are distributed across the cluster. An + account database contains the list of containers in that account. A + container database contains the list of objects in that container. + +- **Objects** - The data itself. + +- **Partitions** - A partition stores objects, account databases, and + container databases and helps manage locations where data lives in + the cluster. + + +.. _objectstorage-building-blocks-figure: + +**Object Storage building blocks** + +.. figure:: figures/objectstorage-buildingblocks.png + + +Proxy servers +------------- + +Proxy servers are the public face of Object Storage and handle all of +the incoming API requests. Once a proxy server receives a request, it +determines the storage node based on the object's URL, for example: +``https://swift.example.com/v1/account/container/object``. Proxy servers +also coordinate responses, handle failures, and coordinate timestamps. + +Proxy servers use a shared-nothing architecture and can be scaled as +needed based on projected workloads. A minimum of two proxy servers +should be deployed behind a separately-managed load balancer. If one +proxy server fails, the others take over. + +Rings +----- + +A ring represents a mapping between the names of entities stored in the +cluster and their physical locations on disks. There are separate rings +for accounts, containers, and objects. 
When components of the system need +to perform an operation on an object, container, or account, they need to +interact with the corresponding ring to determine the appropriate location +in the cluster. + +The ring maintains this mapping using zones, devices, partitions, and +replicas. Each partition in the ring is replicated, by default, three +times across the cluster, and partition locations are stored in the +mapping maintained by the ring. The ring is also responsible for +determining which devices are used as handoffs in failure scenarios. + +Data can be isolated into zones in the ring. Each partition replica +will try to reside in a different zone. A zone could represent a +drive, a server, a cabinet, a switch, or even a data center. + +The partitions of the ring are distributed among all of the devices +in the Object Storage installation. When partitions need to be moved +around (for example, if a device is added to the cluster), the ring +ensures that a minimum number of partitions are moved at a time, and +only one replica of a partition is moved at a time. + +You can use weights to balance the distribution of partitions on drives +across the cluster. This can be useful, for example, when differently +sized drives are used in a cluster. + +The ring is used by the proxy server and several background processes +(like replication). + + +.. _objectstorage-ring-figure: + +**The ring** + +.. figure:: figures/objectstorage-ring.png + +These rings are externally managed. The server processes themselves +do not modify the rings, they are instead given new rings modified by +other tools. + +The ring uses a configurable number of bits from an ``MD5`` hash for a path +as a partition index that designates a device. The number of bits kept +from the hash is known as the partition power, and 2 to the partition +power indicates the partition count. Partitioning the full ``MD5`` hash ring +allows other parts of the cluster to work in batches of items at once +which ends up either more efficient or at least less complex than +working with each item separately or the entire cluster all at once. + +Another configurable value is the replica count, which indicates how +many of the partition-device assignments make up a single ring. For a +given partition index, each replica's device will not be in the same +zone as any other replica's device. Zones can be used to group devices +based on physical locations, power separations, network separations, or +any other attribute that would improve the availability of multiple +replicas at the same time. + +Zones +----- + +Object Storage allows configuring zones in order to isolate failure +boundaries. If possible, each data replica resides in a separate zone. +At the smallest level, a zone could be a single drive or a grouping of a +few drives. If there were five object storage servers, then each server +would represent its own zone. Larger deployments would have an entire +rack (or multiple racks) of object servers, each representing a zone. +The goal of zones is to allow the cluster to tolerate significant +outages of storage servers without losing all replicas of the data. + + +.. _objectstorage-zones-figure: + +**Zones** + +.. figure:: figures/objectstorage-zones.png + + +Accounts and containers +----------------------- + +Each account and container is an individual SQLite database that is +distributed across the cluster. An account database contains the list of +containers in that account. 
A container database contains the list of +objects in that container. + + +.. _objectstorage-accountscontainers-figure: + +**Accounts and containers** + +.. figure:: figures/objectstorage-accountscontainers.png + + +To keep track of object data locations, each account in the system has a +database that references all of its containers, and each container +database references each object. + +Partitions +---------- + +A partition is a collection of stored data. This includes account databases, +container databases, and objects. Partitions are core to the replication +system. + +Think of a partition as a bin moving throughout a fulfillment center +warehouse. Individual orders get thrown into the bin. The system treats +that bin as a cohesive entity as it moves throughout the system. A bin +is easier to deal with than many little things. It makes for fewer +moving parts throughout the system. + +System replicators and object uploads/downloads operate on partitions. +As the system scales up, its behavior continues to be predictable +because the number of partitions is a fixed number. + +Implementing a partition is conceptually simple: a partition is just a +directory sitting on a disk with a corresponding hash table of what it +contains. + + +.. _objectstorage-partitions-figure: + +**Partitions** + +.. figure:: figures/objectstorage-partitions.png + + +Replicators +----------- + +In order to ensure that there are three copies of the data everywhere, +replicators continuously examine each partition. For each local +partition, the replicator compares it against the replicated copies in +the other zones to see if there are any differences. + +The replicator knows if replication needs to take place by examining +hashes. A hash file is created for each partition, which contains hashes +of each directory in the partition. For a given partition, the hash files +for each of the partition's copies are compared. If the hashes are +different, then it is time to replicate, and the directory that needs to +be replicated is copied over. + +This is where partitions come in handy. With fewer things in the system, +larger chunks of data are transferred around (rather than lots of little +TCP connections, which is inefficient) and there is a consistent number +of hashes to compare. + +The cluster has an eventually-consistent behavior where old data may be +served from partitions that missed updates, but replication will cause +all partitions to converge toward the newest data. + + +.. _objectstorage-replication-figure: + +**Replication** + +.. figure:: figures/objectstorage-replication.png + + +If a zone goes down, one of the nodes containing a replica notices and +proactively copies data to a handoff location. + +Use cases +--------- + +The following sections show use cases for object uploads and downloads +and introduce the components. + + +Upload +~~~~~~ + +A client uses the REST API to make a HTTP request to PUT an object into +an existing container. The cluster receives the request. First, the +system must figure out where the data is going to go. To do this, the +account name, container name, and object name are all used to determine +the partition where this object should live. + +Then a lookup in the ring figures out which storage nodes contain the +partitions in question. + +The data is then sent to each storage node where it is placed in the +appropriate partition. At least two of the three writes must be +successful before the client is notified that the upload was successful. 
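The partition lookup described above, where the account, container, and object names determine the partition, can be sketched in a few lines of Python. This is a simplified illustration of the hashing scheme from the Rings section, not the actual ``swift.common.ring`` code; the hash prefix and suffix are the placeholder values from the sample ``swift.conf`` in this change, and the partition power of 10 is an assumed value.

.. code-block:: python

    import hashlib
    import struct

    # Placeholder salts from the sample swift.conf; real clusters keep
    # these secret and never change them.
    HASH_PATH_PREFIX = b'changeme'
    HASH_PATH_SUFFIX = b'changeme'

    def get_partition(account, container, obj, part_power=10):
        """Map an object path to a partition index.

        MD5 the salted path and keep the top ``part_power`` bits, giving
        2 ** part_power partitions in total.
        """
        path = '/%s/%s/%s' % (account, container, obj)
        digest = hashlib.md5(
            HASH_PATH_PREFIX + path.encode('utf-8') + HASH_PATH_SUFFIX
        ).digest()
        # First four bytes as a big-endian integer, shifted so only the
        # most significant part_power bits remain.
        return struct.unpack('>I', digest[:4])[0] >> (32 - part_power)

    print(get_partition('AUTH_test', 'photos', 'cat.jpg'))

The ring then maps that partition index to the set of devices (and therefore storage nodes) holding its replicas.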
+ +Next, the container database is updated asynchronously to reflect that +there is a new object in it. + + +.. _objectstorage-usecase-figure: + +**Object Storage in use** + +.. figure:: figures/objectstorage-usecase.png + + +Download +~~~~~~~~ + +A request comes in for an account/container/object. Using the same +consistent hashing, the partition index is determined. A lookup in the +ring reveals which storage nodes contain that partition. A request is +made to one of the storage nodes to fetch the object and, if that fails, +requests are made to the other nodes. diff --git a/doc/source/admin/objectstorage-features.rst b/doc/source/admin/objectstorage-features.rst new file mode 100644 index 0000000000..b0cb0ed0af --- /dev/null +++ b/doc/source/admin/objectstorage-features.rst @@ -0,0 +1,52 @@ +===================== +Features and benefits +===================== + +.. list-table:: + :header-rows: 1 + :widths: 10 40 + + * - Features + - Benefits + * - Leverages commodity hardware + - No lock-in, lower price/GB. + * - HDD/node failure agnostic + - Self-healing, reliable, data redundancy protects from failures. + * - Unlimited storage + - Large and flat namespace, highly scalable read/write access, + able to serve content directly from storage system. + * - Multi-dimensional scalability + - Scale-out architecture: Scale vertically and + horizontally-distributed storage. Backs up and archives large + amounts of data with linear performance. + * - Account/container/object structure + - No nesting, not a traditional file system: Optimized for scale, + it scales to multiple petabytes and billions of objects. + * - Built-in replication 3✕ + data redundancy (compared with 2✕ on + RAID) + - A configurable number of accounts, containers and object copies + for high availability. + * - Easily add capacity (unlike RAID resize) + - Elastic data scaling with ease. + * - No central database + - Higher performance, no bottlenecks. + * - RAID not required + - Handle many small, random reads and writes efficiently. + * - Built-in management utilities + - Account management: Create, add, verify, and delete users; + Container management: Upload, download, and verify; Monitoring: + Capacity, host, network, log trawling, and cluster health. + * - Drive auditing + - Detect drive failures preempting data corruption. + * - Expiring objects + - Users can set an expiration time or a TTL on an object to + control access. + * - Direct object access + - Enable direct browser access to content, such as for a control + panel. + * - Realtime visibility into client requests + - Know what users are requesting. + * - Supports S3 API + - Utilize tools that were designed for the popular S3 API. + * - Restrict containers per account + - Limit access to control usage by user. diff --git a/doc/source/admin/objectstorage-intro.rst b/doc/source/admin/objectstorage-intro.rst new file mode 100644 index 0000000000..c5061e8a14 --- /dev/null +++ b/doc/source/admin/objectstorage-intro.rst @@ -0,0 +1,23 @@ +============================== +Introduction to Object Storage +============================== + +OpenStack Object Storage (swift) is used for redundant, scalable data +storage using clusters of standardized servers to store petabytes of +accessible data. It is a long-term storage system for large amounts of +static data which can be retrieved and updated. Object Storage uses a +distributed architecture +with no central point of control, providing greater scalability, +redundancy, and permanence. 
Objects are written to multiple hardware +devices, with the OpenStack software responsible for ensuring data +replication and integrity across the cluster. Storage clusters scale +horizontally by adding new nodes. Should a node fail, OpenStack works to +replicate its content from other active nodes. Because OpenStack uses +software logic to ensure data replication and distribution across +different devices, inexpensive commodity hard drives and servers can be +used in lieu of more expensive equipment. + +Object Storage is ideal for cost effective, scale-out storage. It +provides a fully distributed, API-accessible storage platform that can +be integrated directly into applications or used for backup, archiving, +and data retention. diff --git a/doc/source/admin/objectstorage-large-objects.rst b/doc/source/admin/objectstorage-large-objects.rst new file mode 100644 index 0000000000..e4b0490314 --- /dev/null +++ b/doc/source/admin/objectstorage-large-objects.rst @@ -0,0 +1,32 @@ +==================== +Large object support +==================== + +Object Storage (swift) uses segmentation to support the upload of large +objects. By default, Object Storage limits the download size of a single +object to 5GB. Using segmentation, uploading a single object is virtually +unlimited. The segmentation process works by fragmenting the object, +and automatically creating a file that sends the segments together as +a single object. This option offers greater upload speed with the possibility +of parallel uploads. + +Large objects +~~~~~~~~~~~~~ +The large object is comprised of two types of objects: + +- **Segment objects** store the object content. You can divide your + content into segments, and upload each segment into its own segment + object. Segment objects do not have any special features. You create, + update, download, and delete segment objects just as you would normal + objects. + +- A **manifest object** links the segment objects into one logical + large object. When you download a manifest object, Object Storage + concatenates and returns the contents of the segment objects in the + response body of the request. The manifest object types are: + + - **Static large objects** + - **Dynamic large objects** + +To find out more information on large object support, +see :doc:`/overview_large_objects` in the developer documentation. diff --git a/doc/source/admin/objectstorage-monitoring.rst b/doc/source/admin/objectstorage-monitoring.rst new file mode 100644 index 0000000000..86e81711b8 --- /dev/null +++ b/doc/source/admin/objectstorage-monitoring.rst @@ -0,0 +1,216 @@ +========================= +Object Storage monitoring +========================= + +.. note:: + + This section was excerpted from a `blog post by Darrell + Bishop `_ and + has since been edited. + +An OpenStack Object Storage cluster is a collection of many daemons that +work together across many nodes. With so many different components, you +must be able to tell what is going on inside the cluster. Tracking +server-level meters like CPU utilization, load, memory consumption, disk +usage and utilization, and so on is necessary, but not sufficient. + +Swift Recon +~~~~~~~~~~~ + +The Swift Recon middleware (see :ref:`cluster_telemetry_and_monitoring`) +provides general machine statistics, such as load average, socket +statistics, ``/proc/meminfo`` contents, as well as Swift-specific meters: + +- The ``MD5`` sum of each ring file. + +- The most recent object replication time. 
+ +- Count of each type of quarantined file: Account, container, or + object. + +- Count of "async_pendings" (deferred container updates) on disk. + +Swift Recon is middleware that is installed in the object servers +pipeline and takes one required option: A local cache directory. To +track ``async_pendings``, you must set up an additional cron job for +each object server. You access data by either sending HTTP requests +directly to the object server or using the ``swift-recon`` command-line +client. + +There are Object Storage cluster statistics but the typical +server meters overlap with existing server monitoring systems. To get +the Swift-specific meters into a monitoring system, they must be polled. +Swift Recon acts as a middleware meters collector. The +process that feeds meters to your statistics system, such as +``collectd`` and ``gmond``, should already run on the storage node. +You can choose to either talk to Swift Recon or collect the meters +directly. + +Swift-Informant +~~~~~~~~~~~~~~~ + +Swift-Informant middleware (see +`swift-informant `_) has +real-time visibility into Object Storage client requests. It sits in the +pipeline for the proxy server, and after each request to the proxy server it +sends three meters to a ``StatsD`` server: + +- A counter increment for a meter like ``obj.GET.200`` or + ``cont.PUT.404``. + +- Timing data for a meter like ``acct.GET.200`` or ``obj.GET.200``. + [The README says the meters look like ``duration.acct.GET.200``, but + I do not see the ``duration`` in the code. I am not sure what the + Etsy server does but our StatsD server turns timing meters into five + derivative meters with new segments appended, so it probably works as + coded. The first meter turns into ``acct.GET.200.lower``, + ``acct.GET.200.upper``, ``acct.GET.200.mean``, + ``acct.GET.200.upper_90``, and ``acct.GET.200.count``]. + +- A counter increase by the bytes transferred for a meter like + ``tfer.obj.PUT.201``. + +This is used for receiving information on the quality of service clients +experience with the timing meters, as well as sensing the volume of the +various modifications of a request server type, command, and response +code. Swift-Informant requires no change to core Object +Storage code because it is implemented as middleware. However, it gives +no insight into the workings of the cluster past the proxy server. +If the responsiveness of one storage node degrades, you can only see +that some of the requests are bad, either as high latency or error +status codes. + +Statsdlog +~~~~~~~~~ + +The `Statsdlog `_ +project increments StatsD counters based on logged events. Like +Swift-Informant, it is also non-intrusive, however statsdlog can track +events from all Object Storage daemons, not just proxy-server. The +daemon listens to a UDP stream of syslog messages, and StatsD counters +are incremented when a log line matches a regular expression. Meter +names are mapped to regex match patterns in a JSON file, allowing +flexible configuration of what meters are extracted from the log stream. + +Currently, only the first matching regex triggers a StatsD counter +increment, and the counter is always incremented by one. There is no way +to increment a counter by more than one or send timing data to StatsD +based on the log line content. The tool could be extended to handle more +meters for each line and data extraction, including timing data. 
But a +coupling would still exist between the log textual format and the log +parsing regexes, which would themselves be more complex to support +multiple matches for each line and data extraction. Also, log processing +introduces a delay between the triggering event and sending the data to +StatsD. It would be preferable to increment error counters where they +occur and send timing data as soon as it is known to avoid coupling +between a log string and a parsing regex and prevent a time delay +between events and sending data to StatsD. + +The next section describes another method for gathering Object Storage +operational meters. + +Swift StatsD logging +~~~~~~~~~~~~~~~~~~~~ + +StatsD (see `Measure Anything, Measure Everything +`_) +was designed for application code to be deeply instrumented. Meters are +sent in real-time by the code that just noticed or did something. The +overhead of sending a meter is extremely low: a ``sendto`` of one UDP +packet. If that overhead is still too high, the StatsD client library +can send only a random portion of samples and StatsD approximates the +actual number when flushing meters upstream. + +To avoid the problems inherent with middleware-based monitoring and +after-the-fact log processing, the sending of StatsD meters is +integrated into Object Storage itself. Details of the meters tracked +are in the :doc:`/admin_guide`. + +The sending of meters is integrated with the logging framework. To +enable, configure ``log_statsd_host`` in the relevant config file. You +can also specify the port and a default sample rate. The specified +default sample rate is used unless a specific call to a statsd logging +method (see the list below) overrides it. Currently, no logging calls +override the sample rate, but it is conceivable that some meters may +require accuracy (``sample_rate=1``) while others may not. + +.. code-block:: ini + + [DEFAULT] + # ... + log_statsd_host = 127.0.0.1 + log_statsd_port = 8125 + log_statsd_default_sample_rate = 1 + +Then the LogAdapter object returned by ``get_logger()``, usually stored +in ``self.logger``, has these new methods: + +- ``update_stats(self, metric, amount, sample_rate=1)`` Increments + the supplied meter by the given amount. This is used when you need + to add or subtract more that one from a counter, like incrementing + ``suffix.hashes`` by the number of computed hashes in the object + replicator. + +- ``increment(self, metric, sample_rate=1)`` Increments the given counter + meter by one. + +- ``decrement(self, metric, sample_rate=1)`` Lowers the given counter + meter by one. + +- ``timing(self, metric, timing_ms, sample_rate=1)`` Record that the + given meter took the supplied number of milliseconds. + +- ``timing_since(self, metric, orig_time, sample_rate=1)`` + Convenience method to record a timing meter whose value is "now" + minus an existing timestamp. + +.. note:: + + These logging methods may safely be called anywhere you have a + logger object. If StatsD logging has not been configured, the methods + are no-ops. This avoids messy conditional logic each place a meter is + recorded. These example usages show the new logging methods: + + .. code-block:: python + + # swift/obj/replicator.py + def update(self, job): + # ... + begin = time.time() + try: + hashed, local_hash = tpool.execute(tpooled_get_hashes, job['path'], + do_listdir=(self.replication_count % 10) == 0, + reclaim_age=self.reclaim_age) + # See tpooled_get_hashes "Hack". 
+ if isinstance(hashed, BaseException): + raise hashed + self.suffix_hash += hashed + self.logger.update_stats('suffix.hashes', hashed) + # ... + finally: + self.partition_times.append(time.time() - begin) + self.logger.timing_since('partition.update.timing', begin) + + .. code-block:: python + + # swift/container/updater.py + def process_container(self, dbfile): + # ... + start_time = time.time() + # ... + for event in events: + if 200 <= event.wait() < 300: + successes += 1 + else: + failures += 1 + if successes > failures: + self.logger.increment('successes') + # ... + else: + self.logger.increment('failures') + # ... + # Only track timing data for attempted updates: + self.logger.timing_since('timing', start_time) + else: + self.logger.increment('no_changes') + self.no_changes += 1 diff --git a/doc/source/admin/objectstorage-replication.rst b/doc/source/admin/objectstorage-replication.rst new file mode 100644 index 0000000000..32cd33ad60 --- /dev/null +++ b/doc/source/admin/objectstorage-replication.rst @@ -0,0 +1,98 @@ +=========== +Replication +=========== + +Because each replica in Object Storage functions independently and +clients generally require only a simple majority of nodes to respond to +consider an operation successful, transient failures like network +partitions can quickly cause replicas to diverge. These differences are +eventually reconciled by asynchronous, peer-to-peer replicator +processes. The replicator processes traverse their local file systems +and concurrently perform operations in a manner that balances load +across physical disks. + +Replication uses a push model, with records and files generally only +being copied from local to remote replicas. This is important because +data on the node might not belong there (as in the case of hand offs and +ring changes), and a replicator cannot know which data it should pull in +from elsewhere in the cluster. Any node that contains data must ensure +that data gets to where it belongs. The ring handles replica placement. + +To replicate deletions in addition to creations, every deleted record or +file in the system is marked by a tombstone. The replication process +cleans up tombstones after a time period known as the ``consistency +window``. This window defines the duration of the replication and how +long transient failure can remove a node from the cluster. Tombstone +cleanup must be tied to replication to reach replica convergence. + +If a replicator detects that a remote drive has failed, the replicator +uses the ``get_more_nodes`` interface for the ring to choose an +alternate node with which to synchronize. The replicator can maintain +desired levels of replication during disk failures, though some replicas +might not be in an immediately usable location. + +.. note:: + + The replicator does not maintain desired levels of replication when + failures such as entire node failures occur; most failures are + transient. + +The main replication types are: + +- Database replication + Replicates containers and objects. + +- Object replication + Replicates object data. + +Database replication +~~~~~~~~~~~~~~~~~~~~ + +Database replication completes a low-cost hash comparison to determine +whether two replicas already match. Normally, this check can quickly +verify that most databases in the system are already synchronized. If +the hashes differ, the replicator synchronizes the databases by sharing +records added since the last synchronization point. 
+ +This synchronization point is a high water mark that notes the last +record at which two databases were known to be synchronized, and is +stored in each database as a tuple of the remote database ID and record +ID. Database IDs are unique across all replicas of the database, and +record IDs are monotonically increasing integers. After all new records +are pushed to the remote database, the entire synchronization table of +the local database is pushed, so the remote database can guarantee that +it is synchronized with everything with which the local database was +previously synchronized. + +If a replica is missing, the whole local database file is transmitted to +the peer by using rsync(1) and is assigned a new unique ID. + +In practice, database replication can process hundreds of databases per +concurrency setting per second (up to the number of available CPUs or +disks) and is bound by the number of database transactions that must be +performed. + +Object replication +~~~~~~~~~~~~~~~~~~ + +The initial implementation of object replication performed an rsync to +push data from a local partition to all remote servers where it was +expected to reside. While this worked at small scale, replication times +skyrocketed once directory structures could no longer be held in RAM. +This scheme was modified to save a hash of the contents for each suffix +directory to a per-partition hashes file. The hash for a suffix +directory is no longer valid when the contents of that suffix directory +is modified. + +The object replication process reads in hash files and calculates any +invalidated hashes. Then, it transmits the hashes to each remote server +that should hold the partition, and only suffix directories with +differing hashes on the remote server are rsynced. After pushing files +to the remote server, the replication process notifies it to recalculate +hashes for the rsynced suffix directories. + +The number of uncached directories that object replication must +traverse, usually as a result of invalidated suffix directory hashes, +impedes performance. To provide acceptable replication speeds, object +replication is designed to invalidate around 2 percent of the hash space +on a normal node each day. diff --git a/doc/source/admin/objectstorage-ringbuilder.rst b/doc/source/admin/objectstorage-ringbuilder.rst new file mode 100644 index 0000000000..ddd6f6063c --- /dev/null +++ b/doc/source/admin/objectstorage-ringbuilder.rst @@ -0,0 +1,228 @@ +============ +Ring-builder +============ + +Use the swift-ring-builder utility to build and manage rings. This +utility assigns partitions to devices and writes an optimized Python +structure to a gzipped, serialized file on disk for transmission to the +servers. The server processes occasionally check the modification time +of the file and reload in-memory copies of the ring structure as needed. +If you use a slightly older version of the ring, one of the three +replicas for a partition subset will be incorrect because of the way the +ring-builder manages changes to the ring. You can work around this +issue. + +The ring-builder also keeps its own builder file with the ring +information and additional data required to build future rings. It is +very important to keep multiple backup copies of these builder files. +One option is to copy the builder files out to every server while +copying the ring files themselves. Another is to upload the builder +files into the cluster itself. If you lose the builder file, you have to +create a new ring from scratch. 
Nearly all partitions would be assigned +to different devices and, therefore, nearly all of the stored data would +have to be replicated to new locations. So, recovery from a builder file +loss is possible, but data would be unreachable for an extended time. + +Ring data structure +~~~~~~~~~~~~~~~~~~~ + +The ring data structure consists of three top level fields: a list of +devices in the cluster, a list of lists of device ids indicating +partition to device assignments, and an integer indicating the number of +bits to shift an MD5 hash to calculate the partition for the hash. + +Partition assignment list +~~~~~~~~~~~~~~~~~~~~~~~~~ + +This is a list of ``array('H')`` of devices ids. The outermost list +contains an ``array('H')`` for each replica. Each ``array('H')`` has a +length equal to the partition count for the ring. Each integer in the +``array('H')`` is an index into the above list of devices. The partition +list is known internally to the Ring class as ``_replica2part2dev_id``. + +So, to create a list of device dictionaries assigned to a partition, the +Python code would look like: + +.. code-block:: python + + devices = [self.devs[part2dev_id[partition]] for + part2dev_id in self._replica2part2dev_id] + +That code is a little simplistic because it does not account for the +removal of duplicate devices. If a ring has more replicas than devices, +a partition will have more than one replica on a device. + +``array('H')`` is used for memory conservation as there may be millions +of partitions. + +Overload +~~~~~~~~ + +The ring builder tries to keep replicas as far apart as possible while +still respecting device weights. When it can not do both, the overload +factor determines what happens. Each device takes an extra +fraction of its desired partitions to allow for replica dispersion; +after that extra fraction is exhausted, replicas are placed closer +together than optimal. + +The overload factor lets the operator trade off replica +dispersion (durability) against data dispersion (uniform disk usage). + +The default overload factor is 0, so device weights are strictly +followed. + +With an overload factor of 0.1, each device accepts 10% more +partitions than it otherwise would, but only if it needs to maintain +partition dispersion. + +For example, consider a 3-node cluster of machines with equal-size disks; +node A has 12 disks, node B has 12 disks, and node C has +11 disks. The ring has an overload factor of 0.1 (10%). + +Without the overload, some partitions would end up with replicas only +on nodes A and B. However, with the overload, every device can accept +up to 10% more partitions for the sake of dispersion. The +missing disk in C means there is one disk's worth of partitions +to spread across the remaining 11 disks, which gives each +disk in C an extra 9.09% load. Since this is less than the 10% +overload, there is one replica of each partition on each node. + +However, this does mean that the disks in node C have more data +than the disks in nodes A and B. If 80% full is the warning +threshold for the cluster, node C's disks reach 80% full while A +and B's disks are only 72.7% full. + + +Replica counts +~~~~~~~~~~~~~~ + +To support the gradual change in replica counts, a ring can have a real +number of replicas and is not restricted to an integer number of +replicas. + +A fractional replica count is for the whole ring and not for individual +partitions. It indicates the average number of replicas for each +partition. 
For example, a replica count of 3.2 means that 20 percent of +partitions have four replicas and 80 percent have three replicas. + +The replica count is adjustable. For example: + +.. code-block:: console + + $ swift-ring-builder account.builder set_replicas 4 + $ swift-ring-builder account.builder rebalance + +You must rebalance the replica ring in globally distributed clusters. +Operators of these clusters generally want an equal number of replicas +and regions. Therefore, when an operator adds or removes a region, the +operator adds or removes a replica. Removing unneeded replicas saves on +the cost of disks. + +You can gradually increase the replica count at a rate that does not +adversely affect cluster performance. For example: + +.. code-block:: console + + $ swift-ring-builder object.builder set_replicas 3.01 + $ swift-ring-builder object.builder rebalance + ... + + $ swift-ring-builder object.builder set_replicas 3.02 + $ swift-ring-builder object.builder rebalance + ... + +Changes take effect after the ring is rebalanced. Therefore, if you +intend to change from 3 replicas to 3.01 but you accidentally type +2.01, no data is lost. + +Additionally, the :command:`swift-ring-builder X.builder create` command can +now take a decimal argument for the number of replicas. + +Partition shift value +~~~~~~~~~~~~~~~~~~~~~ + +The partition shift value is known internally to the Ring class as +``_part_shift``. This value is used to shift an MD5 hash to calculate +the partition where the data for that hash should reside. Only the top +four bytes of the hash is used in this process. For example, to compute +the partition for the ``/account/container/object`` path using Python: + +.. code-block:: python + + partition = unpack_from('>I', + md5('/account/container/object').digest())[0] >> + self._part_shift + +For a ring generated with part\_power P, the partition shift value is +``32 - P``. + +Build the ring +~~~~~~~~~~~~~~ + +The ring builder process includes these high-level steps: + +#. The utility calculates the number of partitions to assign to each + device based on the weight of the device. For example, for a + partition at the power of 20, the ring has 1,048,576 partitions. One + thousand devices of equal weight each want 1,048.576 partitions. The + devices are sorted by the number of partitions they desire and kept + in order throughout the initialization process. + + .. note:: + + Each device is also assigned a random tiebreaker value that is + used when two devices desire the same number of partitions. This + tiebreaker is not stored on disk anywhere, and so two different + rings created with the same parameters will have different + partition assignments. For repeatable partition assignments, + ``RingBuilder.rebalance()`` takes an optional seed value that + seeds the Python pseudo-random number generator. + +#. The ring builder assigns each partition replica to the device that + requires most partitions at that point while keeping it as far away + as possible from other replicas. The ring builder prefers to assign a + replica to a device in a region that does not already have a replica. + If no such region is available, the ring builder searches for a + device in a different zone, or on a different server. If it does not + find one, it looks for a device with no replicas. Finally, if all + options are exhausted, the ring builder assigns the replica to the + device that has the fewest replicas already assigned. + + .. 
note:: + + The ring builder assigns multiple replicas to one device only if + the ring has fewer devices than it has replicas. + +#. When building a new ring from an old ring, the ring builder + recalculates the desired number of partitions that each device wants. + +#. The ring builder unassigns partitions and gathers these partitions + for reassignment, as follows: + + - The ring builder unassigns any assigned partitions from any + removed devices and adds these partitions to the gathered list. + - The ring builder unassigns any partition replicas that can be + spread out for better durability and adds these partitions to the + gathered list. + - The ring builder unassigns random partitions from any devices that + have more partitions than they need and adds these partitions to + the gathered list. + +#. The ring builder reassigns the gathered partitions to devices by + using a similar method to the one described previously. + +#. When the ring builder reassigns a replica to a partition, the ring + builder records the time of the reassignment. The ring builder uses + this value when it gathers partitions for reassignment so that no + partition is moved twice in a configurable amount of time. The + RingBuilder class knows this configurable amount of time as + ``min_part_hours``. The ring builder ignores this restriction for + replicas of partitions on removed devices because removal of a device + happens on device failure only, and reassignment is the only choice. + +These steps do not always perfectly rebalance a ring due to the random +nature of gathering partitions for reassignment. To help reach a more +balanced ring, the rebalance process is repeated until near perfect +(less than 1 percent off) or when the balance does not improve by at +least 1 percent (indicating we probably cannot get perfect balance due +to wildly imbalanced zones or too many partitions recently moved). diff --git a/doc/source/admin/objectstorage-tenant-specific-image-storage.rst b/doc/source/admin/objectstorage-tenant-specific-image-storage.rst new file mode 100644 index 0000000000..69855d8ef1 --- /dev/null +++ b/doc/source/admin/objectstorage-tenant-specific-image-storage.rst @@ -0,0 +1,32 @@ +============================================================== +Configure project-specific image locations with Object Storage +============================================================== + +For some deployers, it is not ideal to store all images in one place to +enable all projects and users to access them. You can configure the Image +service to store image data in project-specific image locations. Then, +only the following projects can use the Image service to access the +created image: + +- The project who owns the image +- Projects that are defined in ``swift_store_admin_tenants`` and that + have admin-level accounts + +**To configure project-specific image locations** + +#. Configure swift as your ``default_store`` in the + ``glance-api.conf`` file. + +#. Set these configuration options in the ``glance-api.conf`` file: + + - swift_store_multi_tenant + Set to ``True`` to enable tenant-specific storage locations. + Default is ``False``. + + - swift_store_admin_tenants + Specify a list of tenant IDs that can grant read and write access to all + Object Storage containers that are created by the Image service. + +With this configuration, images are stored in an Object Storage service +(swift) endpoint that is pulled from the service catalog for the +authenticated user. 
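The corresponding ``glance-api.conf`` settings look roughly like the
sketch below. The section name and the project ID are illustrative only;
older Image service releases read these options from ``[DEFAULT]``
rather than ``[glance_store]``:

.. code-block:: ini

    [glance_store]
    default_store = swift
    swift_store_multi_tenant = True
    # Placeholder project ID; list the projects that get admin-level
    # access to the image containers.
    swift_store_admin_tenants = 3a531a7e0c3a43e78fcba6cf297bccd2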
diff --git a/doc/source/admin/objectstorage-troubleshoot.rst b/doc/source/admin/objectstorage-troubleshoot.rst
new file mode 100644
index 0000000000..29adaba07a
--- /dev/null
+++ b/doc/source/admin/objectstorage-troubleshoot.rst
@@ -0,0 +1,208 @@
+===========================
+Troubleshoot Object Storage
+===========================
+
+For Object Storage, everything is logged in ``/var/log/syslog`` (or
+``messages`` on some distros). Several settings enable further
+customization of logging, such as ``log_name``, ``log_facility``, and
+``log_level``, within the object server configuration files.
+
+Drive failure
+~~~~~~~~~~~~~
+
+Problem
+-------
+
+A failed drive can prevent Object Storage from performing replication.
+
+Solution
+--------
+
+In the event that a drive has failed, the first step is to make sure the
+drive is unmounted. This will make it easier for Object Storage to work
+around the failure until it has been resolved. If the drive is going to
+be replaced immediately, then it is just best to replace the drive,
+format it, remount it, and let replication fill it up.
+
+If you cannot replace the drive immediately, then it is best to leave it
+unmounted, and remove the drive from the ring. This will allow all the
+replicas that were on that drive to be replicated elsewhere until the
+drive is replaced. Once the drive is replaced, it can be re-added to the
+ring.
+
+You can look at error messages in the ``/var/log/kern.log`` file for
+hints of drive failure.
+
+Server failure
+~~~~~~~~~~~~~~
+
+Problem
+-------
+
+The server may be offline, may have failed, or may require a
+reboot.
+
+Solution
+--------
+
+If a server is having hardware issues, it is a good idea to make sure
+the Object Storage services are not running. This will allow Object
+Storage to work around the failure while you troubleshoot.
+
+If the server just needs a reboot, or a small amount of work that should
+only last a couple of hours, then it is probably best to let Object
+Storage work around the failure and get the machine fixed and back
+online. When the machine comes back online, replication will make sure
+that anything that was missed during the downtime gets updated.
+
+If the server has more serious issues, then it is probably best to
+remove all of the server's devices from the ring. Once the server has
+been repaired and is back online, the server's devices can be added back
+into the ring. It is important that the devices are reformatted before
+putting them back into the ring because they are likely to be responsible
+for a different set of partitions than before.
+
+Detect failed drives
+~~~~~~~~~~~~~~~~~~~~
+
+Problem
+-------
+
+When a drive fails, it can be difficult to detect the failure and to
+determine its details.
+
+Solution
+--------
+
+It has been our experience that when a drive is about to fail, error
+messages appear in the ``/var/log/kern.log`` file. There is a script called
+``swift-drive-audit`` that can be run via cron to watch for bad drives. If
+errors are detected, it will unmount the bad drive, so that Object
+Storage can work around it. The script takes a configuration file with
+the following settings:
+
+..
list-table:: **Description of configuration options for [drive-audit] in drive-audit.conf** + :header-rows: 1 + + * - Configuration option = Default value + - Description + * - ``device_dir = /srv/node`` + - Directory devices are mounted under + * - ``error_limit = 1`` + - Number of errors to find before a device is unmounted + * - ``log_address = /dev/log`` + - Location where syslog sends the logs to + * - ``log_facility = LOG_LOCAL0`` + - Syslog log facility + * - ``log_file_pattern = /var/log/kern.*[!.][!g][!z]`` + - Location of the log file with globbing pattern to check against device + errors locate device blocks with errors in the log file + * - ``log_level = INFO`` + - Logging level + * - ``log_max_line_length = 0`` + - Caps the length of log lines to the value given; no limit if set to 0, + the default. + * - ``log_to_console = False`` + - No help text available for this option. + * - ``minutes = 60`` + - Number of minutes to look back in ``/var/log/kern.log`` + * - ``recon_cache_path = /var/cache/swift`` + - Directory where stats for a few items will be stored + * - ``regex_pattern_1 = \berror\b.*\b(dm-[0-9]{1,2}\d?)\b`` + - No help text available for this option. + * - ``unmount_failed_device = True`` + - No help text available for this option. + +.. warning:: + + This script has only been tested on Ubuntu 10.04; use with caution on + other operating systems in production. + +Emergency recovery of ring builder files +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +Problem +------- + +An emergency might prevent a successful backup from restoring the +cluster to operational status. + +Solution +-------- + +You should always keep a backup of swift ring builder files. However, if +an emergency occurs, this procedure may assist in returning your cluster +to an operational state. + +Using existing swift tools, there is no way to recover a builder file +from a ``ring.gz`` file. However, if you have a knowledge of Python, it +is possible to construct a builder file that is pretty close to the one +you have lost. + +.. warning:: + + This procedure is a last-resort for emergency circumstances. It + requires knowledge of the swift python code and may not succeed. + +#. Load the ring and a new ringbuilder object in a Python REPL: + + .. code-block:: python + + >>> from swift.common.ring import RingData, RingBuilder + >>> ring = RingData.load('/path/to/account.ring.gz') + +#. Start copying the data we have in the ring into the builder: + + .. code-block:: python + + >>> import math + >>> partitions = len(ring._replica2part2dev_id[0]) + >>> replicas = len(ring._replica2part2dev_id) + + >>> builder = RingBuilder(int(math.log(partitions, 2)), replicas, 1) + >>> builder.devs = ring.devs + >>> builder._replica2part2dev = ring._replica2part2dev_id + >>> builder._last_part_moves_epoch = 0 + >>> from array import array + >>> builder._last_part_moves = array('B', (0 for _ in range(partitions))) + >>> builder._set_parts_wanted() + >>> for d in builder._iter_devs(): + d['parts'] = 0 + >>> for p2d in builder._replica2part2dev: + for dev_id in p2d: + builder.devs[dev_id]['parts'] += 1 + + This is the extent of the recoverable fields. + +#. For ``min_part_hours`` you either have to remember what the value you + used was, or just make up a new one: + + .. code-block:: python + + >>> builder.change_min_part_hours(24) # or whatever you want it to be + +#. Validate the builder. If this raises an exception, check your + previous code: + + .. code-block:: python + + >>> builder.validate() + +#. 
After it validates, save the builder and create a new ``account.builder``: + + .. code-block:: python + + >>> import pickle + >>> pickle.dump(builder.to_dict(), open('account.builder', 'wb'), protocol=2) + >>> exit () + +#. You should now have a file called ``account.builder`` in the current + working directory. Run + :command:`swift-ring-builder account.builder write_ring` and compare the new + ``account.ring.gz`` to the ``account.ring.gz`` that you started + from. They probably are not byte-for-byte identical, but if you load them + in a REPL and their ``_replica2part2dev_id`` and ``devs`` attributes are + the same (or nearly so), then you are in good shape. + +#. Repeat the procedure for ``container.ring.gz`` and + ``object.ring.gz``, and you might get usable builder files. diff --git a/doc/source/admin_guide.rst b/doc/source/admin_guide.rst index b1d00fa364..8754fd34d7 100644 --- a/doc/source/admin_guide.rst +++ b/doc/source/admin_guide.rst @@ -2,6 +2,33 @@ Administrator's Guide ===================== +------------------------- +Defining Storage Policies +------------------------- + +Defining your Storage Policies is very easy to do with Swift. It is important +that the administrator understand the concepts behind Storage Policies +before actually creating and using them in order to get the most benefit out +of the feature and, more importantly, to avoid having to make unnecessary changes +once a set of policies have been deployed to a cluster. + +It is highly recommended that the reader fully read and comprehend +:doc:`overview_policies` before proceeding with administration of +policies. Plan carefully and it is suggested that experimentation be +done first on a non-production cluster to be certain that the desired +configuration meets the needs of the users. See :ref:`upgrade-policy` +before planning the upgrade of your existing deployment. + +Following is a high level view of the very few steps it takes to configure +policies once you have decided what you want to do: + +#. Define your policies in ``/etc/swift/swift.conf`` +#. Create the corresponding object rings +#. Communicate the names of the Storage Policies to cluster users + +For a specific example that takes you through these steps, please see +:doc:`policies_saio` + ------------------ Managing the Rings ------------------ @@ -22,25 +49,27 @@ ring building server **last** after all Swift nodes have been successfully upgraded, or refrain from generating rings until all Swift nodes have been successfully upgraded. -If you need to downgrade from a version of swift greater than 1.6.0 to +If you need to downgrade from a version of Swift greater than 1.6.0 to a version less than or equal to 1.6.0, first downgrade your ring-building server, generate new rings, push them out, then continue with the rest of the downgrade. For more information see :doc:`overview_ring`. +.. highlight:: none + Removing a device from the ring:: swift-ring-builder remove / - + Removing a server from the ring:: swift-ring-builder remove - + Adding devices to the ring: See :ref:`ring-preparing` - + See what devices for a server are in the ring:: swift-ring-builder search @@ -49,10 +78,79 @@ Once you are done with all changes to the ring, the changes need to be "committed":: swift-ring-builder rebalance - + Once the new rings are built, they should be pushed out to all the servers in the cluster. 
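How the ring files are pushed out is deployment specific; any mechanism
that copies the ``.ring.gz`` files to ``/etc/swift`` on every node will
do. A minimal illustration using ``scp`` (the hostnames are
placeholders)::

    for node in proxy01 storage01 storage02 storage03; do
        scp /etc/swift/*.ring.gz ${node}:/etc/swift/
    done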
+Optionally, if invoked as 'swift-ring-builder-safe' the directory containing +the specified builder file will be locked (via a .lock file in the parent +directory). This provides a basic safe guard against multiple instances +of the swift-ring-builder (or other utilities that observe this lock) from +attempting to write to or read the builder/ring files while operations are in +progress. This can be useful in environments where ring management has been +automated but the operator still needs to interact with the rings manually. + +If the ring builder is not producing the balances that you are +expecting, you can gain visibility into what it's doing with the +``--debug`` flag.:: + + swift-ring-builder rebalance --debug + +This produces a great deal of output that is mostly useful if you are +either (a) attempting to fix the ring builder, or (b) filing a bug +against the ring builder. + +You may notice in the rebalance output a 'dispersion' number. What this +number means is explained in :ref:`ring_dispersion` but in essence +is the percentage of partitions in the ring that have too many replicas +within a particular failure domain. You can ask 'swift-ring-builder' what +the dispersion is with:: + + swift-ring-builder dispersion + +This will give you the percentage again, if you want a detailed view of +the dispersion simply add a ``--verbose``:: + + swift-ring-builder dispersion --verbose + +This will not only display the percentage but will also display a dispersion +table that lists partition dispersion by tier. You can use this table to figure +out were you need to add capacity or to help tune an :ref:`ring_overload` value. + +Now let's take an example with 1 region, 3 zones and 4 devices. Each device has +the same weight, and the ``dispersion --verbose`` might show the following:: + + Dispersion is 16.666667, Balance is 0.000000, Overload is 0.00% + Required overload is 33.333333% + Worst tier is 33.333333 (r1z3) + -------------------------------------------------------------------------- + Tier Parts % Max 0 1 2 3 + -------------------------------------------------------------------------- + r1 768 0.00 3 0 0 0 256 + r1z1 192 0.00 1 64 192 0 0 + r1z1-127.0.0.1 192 0.00 1 64 192 0 0 + r1z1-127.0.0.1/sda 192 0.00 1 64 192 0 0 + r1z2 192 0.00 1 64 192 0 0 + r1z2-127.0.0.2 192 0.00 1 64 192 0 0 + r1z2-127.0.0.2/sda 192 0.00 1 64 192 0 0 + r1z3 384 33.33 1 0 128 128 0 + r1z3-127.0.0.3 384 33.33 1 0 128 128 0 + r1z3-127.0.0.3/sda 192 0.00 1 64 192 0 0 + r1z3-127.0.0.3/sdb 192 0.00 1 64 192 0 0 + +The first line reports that there are 256 partitions with 3 copies in region 1; +and this is an expected output in this case (single region with 3 replicas) as +reported by the "Max" value. + +However, there is some imbalance in the cluster, more precisely in zone 3. The +"Max" reports a maximum of 1 copy in this zone; however 50.00% of the partitions +are storing 2 replicas in this zone (which is somewhat expected, because there +are more disks in this zone). + +You can now either add more capacity to the other zones, decrease the total +weight in zone 3 or set the overload to a value `greater than` 33.333333% - +only as much overload as needed will be used. + ----------------------- Scripting Ring Creation ----------------------- @@ -65,18 +163,19 @@ You can create scripts to create the account and container rings and rebalance. 
cd /etc/swift rm -f account.builder account.ring.gz backups/account.builder backups/account.ring.gz swift-ring-builder account.builder create 18 3 1 - swift-ring-builder account.builder add z1-:6002/sdb1 1 - swift-ring-builder account.builder add z2-:6002/sdb1 1 + swift-ring-builder account.builder add r1z1-:6202/sdb1 1 + swift-ring-builder account.builder add r1z2-:6202/sdb1 1 swift-ring-builder account.builder rebalance You need to replace the values of , , etc. with the IP addresses of the account servers used in your setup. You can have as many account servers as you need. All account servers are assumed to be listening on port - 6002, and have a storage device called "sdb1" (this is a directory + 6202, and have a storage device called "sdb1" (this is a directory name created under /drives when we setup the account server). The "z1", "z2", etc. designate zones, and you can choose whether you - put devices in the same or different zones. + put devices in the same or different zones. The "r1" designates + the region, with different regions specified as "r1", "r2", etc. 2. Make the script file executable and run it to create the account ring file:: @@ -104,22 +203,37 @@ Handling Drive Failure ---------------------- In the event that a drive has failed, the first step is to make sure the drive -is unmounted. This will make it easier for swift to work around the failure +is unmounted. This will make it easier for Swift to work around the failure until it has been resolved. If the drive is going to be replaced immediately, then it is just best to replace the drive, format it, remount it, and let replication fill it up. +After the drive is unmounted, make sure the mount point is owned by root +(root:root 755). This ensures that rsync will not try to replicate into the +root drive once the failed drive is unmounted. + If the drive can't be replaced immediately, then it is best to leave it -unmounted, and remove the drive from the ring. This will allow all the +unmounted, and set the device weight to 0. This will allow all the replicas that were on that drive to be replicated elsewhere until the drive -is replaced. Once the drive is replaced, it can be re-added to the ring. +is replaced. Once the drive is replaced, the device weight can be increased +again. Setting the device weight to 0 instead of removing the drive from the +ring gives Swift the chance to replicate data from the failing disk too (in case +it is still possible to read some of the data). + +Setting the device weight to 0 (or removing a failed drive from the ring) has +another benefit: all partitions that were stored on the failed drive are +distributed over the remaining disks in the cluster, and each disk only needs to +store a few new partitions. This is much faster compared to replicating all +partitions to a single, new disk. It decreases the time to recover from a +degraded number of replicas significantly, and becomes more and more important +with bigger disks. ----------------------- Handling Server Failure ----------------------- -If a server is having hardware issues, it is a good idea to make sure the -swift services are not running. This will allow Swift to work around the +If a server is having hardware issues, it is a good idea to make sure the +Swift services are not running. This will allow Swift to work around the failure while you troubleshoot. 
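For example, on most installations the daemons on the affected node can
be stopped with ``swift-init`` while the hardware is being examined (a
brief illustration; your init system or service manager may differ)::

    swift-init all stop     # stop every Swift daemon on this node
    swift-init all start    # once the hardware is healthy again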
If the server just needs a reboot, or a small amount of work that should @@ -141,31 +255,156 @@ Detecting Failed Drives It has been our experience that when a drive is about to fail, error messages will spew into `/var/log/kern.log`. There is a script called -`swift-drive-audit` that can be run via cron to watch for bad drives. If +`swift-drive-audit` that can be run via cron to watch for bad drives. If errors are detected, it will unmount the bad drive, so that Swift can work around it. The script takes a configuration file with the following settings: -[drive-audit] +``[drive-audit]`` + +================== ============== =========================================== +Option Default Description +------------------ -------------- ------------------------------------------- +user swift Drop privileges to this user for non-root + tasks +log_facility LOG_LOCAL0 Syslog log facility +log_level INFO Log level +device_dir /srv/node Directory devices are mounted under +minutes 60 Number of minutes to look back in + `/var/log/kern.log` +error_limit 1 Number of errors to find before a device + is unmounted +log_file_pattern /var/log/kern* Location of the log file with globbing + pattern to check against device errors +regex_pattern_X (see below) Regular expression patterns to be used to + locate device blocks with errors in the + log file +================== ============== =========================================== + +The default regex pattern used to locate device blocks with errors are +`\berror\b.*\b(sd[a-z]{1,2}\d?)\b` and `\b(sd[a-z]{1,2}\d?)\b.*\berror\b`. +One is able to overwrite the default above by providing new expressions +using the format `regex_pattern_X = regex_expression`, where `X` is a number. + +This script has been tested on Ubuntu 10.04 and Ubuntu 12.04, so if you are +using a different distro or OS, some care should be taken before using in production. + +------------------------------ +Preventing Disk Full Scenarios +------------------------------ + +.. highlight:: cfg + +Prevent disk full scenarios by ensuring that the ``proxy-server`` blocks PUT +requests and rsync prevents replication to the specific drives. + +You can prevent `proxy-server` PUT requests to low space disks by +ensuring ``fallocate_reserve`` is set in ``account-server.conf``, +``container-server.conf``, and ``object-server.conf``. By default, +``fallocate_reserve`` is set to 1%. In the object server, this blocks +PUT requests that would leave the free disk space below 1% of the +disk. In the account and container servers, this blocks operations +that will increase account or container database size once the free +disk space falls below 1%. + +Setting ``fallocate_reserve`` is highly recommended to avoid filling +disks to 100%. When Swift's disks are completely full, all requests +involving those disks will fail, including DELETE requests that would +otherwise free up space. This is because object deletion includes the +creation of a zero-byte tombstone (.ts) to record the time of the +deletion for replication purposes; this happens prior to deletion of +the object's data. On a completely-full filesystem, that zero-byte .ts +file cannot be created, so the DELETE request will fail and the disk +will remain completely full. If ``fallocate_reserve`` is set, then the +filesystem will have enough space to create the zero-byte .ts file, +and thus the deletion of the object will succeed and free up some +space. 
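For example, to keep a little more headroom than the default, raise
``fallocate_reserve`` in the ``[DEFAULT]`` section of the object,
container, and account server configs (the 2% value below is only an
illustration):

.. code:: cfg

    [DEFAULT]
    # Refuse writes once free space on a disk falls below 2%.
    fallocate_reserve = 2%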
+ +In order to prevent rsync replication to specific drives, firstly +setup ``rsync_module`` per disk in your ``object-replicator``. +Set this in ``object-server.conf``: + +.. code:: cfg + + [object-replicator] + rsync_module = {replication_ip}::object_{device} + +Set the individual drives in ``rsync.conf``. For example: + +.. code:: cfg + + [object_sda] + max connections = 4 + lock file = /var/lock/object_sda.lock + + [object_sdb] + max connections = 4 + lock file = /var/lock/object_sdb.lock + +Finally, monitor the disk space of each disk and adjust the rsync +``max connections`` per drive to ``-1``. We recommend utilising your existing +monitoring solution to achieve this. The following is an example script: -================== ========== =========================================== -Option Default Description ------------------- ---------- ------------------------------------------- -log_facility LOG_LOCAL0 Syslog log facility -log_level INFO Log level -device_dir /srv/node Directory devices are mounted under -minutes 60 Number of minutes to look back in - `/var/log/kern.log` -error_limit 1 Number of errors to find before a device - is unmounted -================== ========== =========================================== +.. code-block:: python -This script has only been tested on Ubuntu 10.04, so if you are using a -different distro or OS, some care should be taken before using in production. + #!/usr/bin/env python + import os + import errno --------------- -Cluster Health --------------- + RESERVE = 500 * 2 ** 20 # 500 MiB + + DEVICES = '/srv/node1' + + path_template = '/etc/rsync.d/disable_%s.conf' + config_template = ''' + [object_%s] + max connections = -1 + ''' + + def disable_rsync(device): + with open(path_template % device, 'w') as f: + f.write(config_template.lstrip() % device) + + + def enable_rsync(device): + try: + os.unlink(path_template % device) + except OSError as e: + # ignore file does not exist + if e.errno != errno.ENOENT: + raise + + + for device in os.listdir(DEVICES): + path = os.path.join(DEVICES, device) + st = os.statvfs(path) + free = st.f_bavail * st.f_frsize + if free < RESERVE: + disable_rsync(device) + else: + enable_rsync(device) + +For the above script to work, ensure ``/etc/rsync.d/`` conf files are +included, by specifying ``&include`` in your ``rsync.conf`` file: + +.. code:: cfg + + &include /etc/rsync.d + +Use this in conjunction with a cron job to periodically run the script, for example: + +.. highlight:: none + +.. code:: cfg + + # /etc/cron.d/devicecheck + * * * * * root /some/path/to/disable_rsync.py + +.. _dispersion_report: + +----------------- +Dispersion Report +----------------- There is a swift-dispersion-report tool for measuring overall cluster health. This is accomplished by checking if a set of deliberately distributed @@ -191,6 +430,8 @@ object names until they fall on distinct partitions. Last, and repeatedly for the life of the cluster, we need to run the swift-dispersion-report tool to check the health of each of these containers and objects. +.. highlight:: cfg + These tools need direct access to the entire cluster and to the ring files (installing them on a proxy server will probably do). Both swift-dispersion-populate and swift-dispersion-report use the same @@ -200,10 +441,14 @@ configuration file, /etc/swift/dispersion.conf. Example conf file:: auth_url = http://localhost:8080/auth/v1.0 auth_user = test:tester auth_key = testing + endpoint_type = internalURL + +.. 
highlight:: none There are also options for the conf file for specifying the dispersion coverage (defaults to 1%), retries, concurrency, etc. though usually the defaults are -fine. +fine. If you want to use keystone v3 for authentication there are options like +auth_version, user_domain_name, project_domain_name and project_name. Once the configuration is in place, run `swift-dispersion-populate` to populate the containers and objects throughout the cluster. @@ -216,7 +461,7 @@ the cluster. Here is an example of a cluster in perfect health:: Queried 2621 containers for dispersion reporting, 19s, 0 retries 100.00% of container copies found (7863 of 7863) Sample represents 1.00% of the container partition space - + Queried 2619 objects for dispersion reporting, 7s, 0 retries 100.00% of object copies found (7857 of 7857) Sample represents 1.00% of the object partition space @@ -232,7 +477,7 @@ that has:: Queried 2621 containers for dispersion reporting, 8s, 0 retries 100.00% of container copies found (7863 of 7863) Sample represents 1.00% of the container partition space - + Queried 2619 objects for dispersion reporting, 7s, 0 retries There were 1763 partitions missing one copy. 77.56% of object copies found (6094 of 7857) @@ -266,12 +511,157 @@ You can also run the report for only containers or objects:: 100.00% of object copies found (7857 of 7857) Sample represents 1.00% of the object partition space -Alternatively, the dispersion report can also be output in json format. This +Alternatively, the dispersion report can also be output in JSON format. This allows it to be more easily consumed by third party utilities:: $ swift-dispersion-report -j {"object": {"retries:": 0, "missing_two": 0, "copies_found": 7863, "missing_one": 0, "copies_expected": 7863, "pct_found": 100.0, "overlapping": 0, "missing_all": 0}, "container": {"retries:": 0, "missing_two": 0, "copies_found": 12534, "missing_one": 0, "copies_expected": 12534, "pct_found": 100.0, "overlapping": 15, "missing_all": 0}} +Note that you may select which storage policy to use by setting the option +'--policy-name silver' or '-P silver' (silver is the example policy name here). +If no policy is specified, the default will be used per the swift.conf file. +When you specify a policy the containers created also include the policy index, +thus even when running a container_only report, you will need to specify the +policy not using the default. + +----------------------------------------------- +Geographically Distributed Swift Considerations +----------------------------------------------- + +Swift provides two features that may be used to distribute replicas of objects +across multiple geographically distributed data-centers: with +:doc:`overview_global_cluster` object replicas may be dispersed across devices +from different data-centers by using `regions` in ring device descriptors; with +:doc:`overview_container_sync` objects may be copied between independent Swift +clusters in each data-center. The operation and configuration of each are +described in their respective documentation. The following points should be +considered when selecting the feature that is most appropriate for a particular +use case: + +#. Global Clusters allows the distribution of object replicas across + data-centers to be controlled by the cluster operator on per-policy basis, + since the distribution is determined by the assignment of devices from + each data-center in each policy's ring file. 
With Container Sync the end + user controls the distribution of objects across clusters on a + per-container basis. + +#. Global Clusters requires an operator to coordinate ring deployments across + multiple data-centers. Container Sync allows for independent management of + separate Swift clusters in each data-center, and for existing Swift + clusters to be used as peers in Container Sync relationships without + deploying new policies/rings. + +#. Global Clusters seamlessly supports features that may rely on + cross-container operations such as large objects and versioned writes. + Container Sync requires the end user to ensure that all required + containers are sync'd for these features to work in all data-centers. + +#. Global Clusters makes objects available for GET or HEAD requests in both + data-centers even if a replica of the object has not yet been + asynchronously migrated between data-centers, by forwarding requests + between data-centers. Container Sync is unable to serve requests for an + object in a particular data-center until the asynchronous sync process has + copied the object to that data-center. + +#. Global Clusters may require less storage capacity than Container Sync to + achieve equivalent durability of objects in each data-center. Global + Clusters can restore replicas that are lost or corrupted in one + data-center using replicas from other data-centers. Container Sync + requires each data-center to independently manage the durability of + objects, which may result in each data-center storing more replicas than + with Global Clusters. + +#. Global Clusters execute all account/container metadata updates + synchronously to account/container replicas in all data-centers, which may + incur delays when making updates across WANs. Container Sync only copies + objects between data-centers and all Swift internal traffic is + confined to each data-center. + +#. Global Clusters does not yet guarantee the availability of objects stored + in Erasure Coded policies when one data-center is offline. With Container + Sync the availability of objects in each data-center is independent of the + state of other data-centers once objects have been synced. Container Sync + also allows objects to be stored using different policy types in different + data-centers. + +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ +Checking handoff partition distribution +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +You can check if handoff partitions are piling up on a server by +comparing the expected number of partitions with the actual number on +your disks. 
First get the number of partitions that are currently +assigned to a server using the ``dispersion`` command from +``swift-ring-builder``:: + + swift-ring-builder sample.builder dispersion --verbose + Dispersion is 0.000000, Balance is 0.000000, Overload is 0.00% + Required overload is 0.000000% + -------------------------------------------------------------------------- + Tier Parts % Max 0 1 2 3 + -------------------------------------------------------------------------- + r1 8192 0.00 2 0 0 8192 0 + r1z1 4096 0.00 1 4096 4096 0 0 + r1z1-172.16.10.1 4096 0.00 1 4096 4096 0 0 + r1z1-172.16.10.1/sda1 4096 0.00 1 4096 4096 0 0 + r1z2 4096 0.00 1 4096 4096 0 0 + r1z2-172.16.10.2 4096 0.00 1 4096 4096 0 0 + r1z2-172.16.10.2/sda1 4096 0.00 1 4096 4096 0 0 + r1z3 4096 0.00 1 4096 4096 0 0 + r1z3-172.16.10.3 4096 0.00 1 4096 4096 0 0 + r1z3-172.16.10.3/sda1 4096 0.00 1 4096 4096 0 0 + r1z4 4096 0.00 1 4096 4096 0 0 + r1z4-172.16.20.4 4096 0.00 1 4096 4096 0 0 + r1z4-172.16.20.4/sda1 4096 0.00 1 4096 4096 0 0 + r2 8192 0.00 2 0 8192 0 0 + r2z1 4096 0.00 1 4096 4096 0 0 + r2z1-172.16.20.1 4096 0.00 1 4096 4096 0 0 + r2z1-172.16.20.1/sda1 4096 0.00 1 4096 4096 0 0 + r2z2 4096 0.00 1 4096 4096 0 0 + r2z2-172.16.20.2 4096 0.00 1 4096 4096 0 0 + r2z2-172.16.20.2/sda1 4096 0.00 1 4096 4096 0 0 + +As you can see from the output, each server should store 4096 partitions, and +each region should store 8192 partitions. This example used a partition power +of 13 and 3 replicas. + +With write_affinity enabled it is expected to have a higher number of +partitions on disk compared to the value reported by the +swift-ring-builder dispersion command. The number of additional (handoff) +partitions in region r1 depends on your cluster size, the amount +of incoming data as well as the replication speed. + +Let's use the example from above with 6 nodes in 2 regions, and write_affinity +configured to write to region r1 first. `swift-ring-builder` reported that +each node should store 4096 partitions:: + + Expected partitions for region r2: 8192 + Handoffs stored across 4 nodes in region r1: 8192 / 4 = 2048 + Maximum number of partitions on each server in region r1: 2048 + 4096 = 6144 + +Worst case is that handoff partitions in region 1 are populated with new +object replicas faster than replication is able to move them to region 2. +In that case you will see ~ 6144 partitions per +server in region r1. Your actual number should be lower and +between 4096 and 6144 partitions (preferably on the lower side). + +Now count the number of object partitions on a given server in region 1, +for example on 172.16.10.1. Note that the pathnames might be +different; `/srv/node/` is the default mount location, and `objects` +applies only to storage policy 0 (storage policy 1 would use +`objects-1` and so on):: + + find -L /srv/node/ -maxdepth 3 -type d -wholename "*objects/*" | wc -l + +If this number is always on the upper end of the expected partition +number range (4096 to 6144) or increasing you should check your +replication speed and maybe even disable write_affinity. +Please refer to the next section how to collect metrics from Swift, and +especially :ref:`swift-recon -r ` how to check replication +stats. + + +.. _cluster_telemetry_and_monitoring: -------------------------------- Cluster Telemetry and Monitoring @@ -282,6 +672,8 @@ object servers using the recon server middleware and the swift-recon cli. To do so update your account, container, or object servers pipelines to include recon and add the associated filter config. 
+.. highlight:: cfg + object-server.conf sample:: [pipeline:main] @@ -309,9 +701,11 @@ account-server.conf sample:: use = egg:swift#recon recon_cache_path = /var/cache/swift +.. highlight:: none + The recon_cache_path simply sets the directory where stats for a few items will be stored. Depending on the method of deployment you may need to create this -directory manually and ensure that swift has read/write access. +directory manually and ensure that Swift has read/write access. Finally, if you also wish to track asynchronous pending on your object servers you will need to setup a cronjob to run the swift-recon-cron script @@ -319,10 +713,11 @@ periodically on your object servers:: */5 * * * * swift /usr/bin/swift-recon-cron /etc/swift/object-server.conf -Once the recon middleware is enabled a GET request for "/recon/" to -the server will return a json formatted response:: +Once the recon middleware is enabled, a GET request for +"/recon/" to the backend object server will return a +JSON-formatted response:: - fhines@ubuntu:~$ curl -i http://localhost:6030/recon/async + fhines@ubuntu:~$ curl -i http://localhost:6230/recon/async HTTP/1.1 200 OK Content-Type: application/json Content-Length: 20 @@ -330,6 +725,10 @@ the server will return a json formatted response:: {"async_pending": 0} + +Note that the default port for the object server is 6200, except on a +Swift All-In-One installation, which uses 6210, 6220, 6230, and 6240. + The following metrics and telemetry are currently exposed: ========================= ======================================================================================== @@ -340,23 +739,32 @@ Request URI Description /recon/mounted returns *ALL* currently mounted filesystems /recon/unmounted returns all unmounted drives if mount_check = True /recon/diskusage returns disk utilization for storage devices +/recon/driveaudit returns # of drive audit errors /recon/ringmd5 returns object/container/account ring md5sums +/recon/swiftconfmd5 returns swift.conf md5sum /recon/quarantined returns # of quarantined objects/accounts/containers /recon/sockstat returns consumable info from /proc/net/sockstat|6 /recon/devices returns list of devices and devices dir i.e. /srv/node /recon/async returns count of async pending -/recon/replication returns object replication times (for backward compatability) +/recon/replication returns object replication info (for backward compatibility) /recon/replication/ returns replication info for given type (account, container, object) /recon/auditor/ returns auditor stats on last reported scan for given type (account, container, object) /recon/updater/ returns last updater sweep times for given type (container, object) +/recon/expirer/object returns time elapsed and number of objects deleted during last object expirer sweep +/recon/version returns Swift version +/recon/time returns node time ========================= ======================================================================================== +Note that 'object_replication_last' and 'object_replication_time' in object +replication info are considered to be transitional and will be removed in +the subsequent releases. Use 'replication_last' and 'replication_time' instead. 
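+
+If you want to consume these endpoints directly rather than through the
+command line utility described below, a short script is usually sufficient.
+The following is a minimal sketch (not part of Swift itself); the host and
+port are assumptions for an example deployment, and it assumes the
+``diskusage`` payload is a list of per-device dictionaries as returned by
+the recon middleware:
+
+.. code-block:: python
+
+    import json
+    import urllib.request
+
+    # Assumed backend object server address; adjust to your deployment.
+    RECON_URL = 'http://localhost:6200/recon/diskusage'
+
+    with urllib.request.urlopen(RECON_URL) as resp:
+        devices = json.load(resp)
+
+    for dev in devices:
+        if not dev.get('mounted'):
+            print('%s is not mounted' % dev['device'])
+            continue
+        # 'size' and 'used' are reported in bytes.
+        pct_used = 100.0 * dev['used'] / dev['size']
+        print('%s: %.1f%% used' % (dev['device'], pct_used))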
+ This information can also be queried via the swift-recon command line utility:: fhines@ubuntu:~$ swift-recon -h - Usage: + Usage: usage: swift-recon [-v] [--suppress] [-a] [-r] [-u] [-d] - [-l] [--md5] [--auditor] [--updater] [--expirer] [--sockstat] + [-R] [-l] [-T] [--md5] [--auditor] [--updater] [--expirer] [--sockstat] account|container|object Defaults to object server. @@ -370,6 +778,7 @@ This information can also be queried via the swift-recon command line utility:: --suppress Suppress most connection related errors -a, --async Get async stats -r, --replication Get replication stats + -R, --reconstruction Get reconstruction stats --auditor Get auditor stats --updater Get updater stats --expirer Get expirer stats @@ -379,12 +788,17 @@ This information can also be queried via the swift-recon command line utility:: -q, --quarantined Get cluster quarantine stats --md5 Get md5sum of servers ring and compare to local copy --sockstat Get cluster socket usage stats - --all Perform all checks. Equal to -arudlq --md5 --sockstat + -T, --time Check time synchronization + --all Perform all checks. Equal to + -arudlqT --md5 --sockstat --auditor --updater + --expirer --driveaudit --validate-servers -z ZONE, --zone=ZONE Only query servers in specified zone -t SECONDS, --timeout=SECONDS Time to wait for a response from a server --swiftdir=SWIFTDIR Default = /etc/swift +.. _recon-replication: + For example, to obtain container replication info from all hosts in zone "3":: fhines@ubuntu:~$ swift-recon container -r --zone 3 @@ -401,20 +815,31 @@ For example, to obtain container replication info from all hosts in zone "3":: Reporting Metrics to StatsD --------------------------- +.. highlight:: cfg + +.. note:: + The legacy statsd metrics described in this section are being supplemented + with :doc:`metrics/labels`. + If you have a StatsD_ server running, Swift may be configured to send it real-time operational metrics. To enable this, set the following configuration entries (see the sample configuration files):: log_statsd_host = localhost log_statsd_port = 8125 - log_statsd_default_sample_rate = 1 + log_statsd_default_sample_rate = 1.0 + log_statsd_sample_rate_factor = 1.0 log_statsd_metric_prefix = [empty-string] If `log_statsd_host` is not set, this feature is disabled. The default values -for the other settings are given above. - -.. _StatsD: http://codeascraft.etsy.com/2011/02/15/measure-anything-measure-everything/ -.. _Graphite: http://graphite.wikidot.com/ +for the other settings are given above. The `log_statsd_host` can be a +hostname, an IPv4 address, or an IPv6 address (not surrounded with brackets, as +this is unnecessary since the port is specified separately). If a hostname +resolves to an IPv4 address, an IPv4 socket will be used to send StatsD UDP +packets, even if the hostname would also resolve to an IPv6 address. + +.. _StatsD: https://codeascraft.com/2011/02/15/measure-anything-measure-everything/ +.. _Graphite: http://graphiteapp.org/ .. _Ganglia: http://ganglia.sourceforge.net/ The sample rate is a real number between 0 and 1 which defines the @@ -422,9 +847,24 @@ probability of sending a sample for any given event or timing measurement. This sample rate is sent with each sample to StatsD and used to multiply the value. For example, with a sample rate of 0.5, StatsD will multiply that counter's value by 2 when flushing the metric to an upstream -monitoring system (Graphite_, Ganglia_, etc.). 
To get the best data, start -with the default `log_statsd_default_sample_rate` value of 1 and only lower -it as needed. +monitoring system (Graphite_, Ganglia_, etc.). + +Some relatively high-frequency metrics have a default sample rate less than +one. If you want to override the default sample rate for all metrics whose +default sample rate is not specified in the Swift source, you may set +`log_statsd_default_sample_rate` to a value less than one. This is NOT +recommended (see next paragraph). A better way to reduce StatsD load is to +adjust `log_statsd_sample_rate_factor` to a value less than one. The +`log_statsd_sample_rate_factor` is multiplied to any sample rate (either the +global default or one specified by the actual metric logging call in the Swift +source) prior to handling. In other words, this one tunable can lower the +frequency of all StatsD logging by a proportional amount. + +To get the best data, start with the default `log_statsd_default_sample_rate` +and `log_statsd_sample_rate_factor` values of 1 and only lower +`log_statsd_sample_rate_factor` if needed. The +`log_statsd_default_sample_rate` should not be used and remains for backward +compatibility only. The metric prefix will be prepended to every metric sent to the StatsD server For example, with:: @@ -437,411 +877,38 @@ servers when sending statistics to a central StatsD server. If you run a local StatsD server per node, you could configure a per-node metrics prefix there and leave `log_statsd_metric_prefix` blank. -Note that metrics reported to StatsD are counters or timing data (which -StatsD usually expands out to min, max, avg, count, and 90th percentile -per timing metric). Some important "gauge" metrics will still need to -be collected using another method. For example, the -`object-server.async_pendings` StatsD metric counts the generation of -async_pendings in real-time, but will not tell you the current number -of async_pending container updates on disk at any point in time. +Note that metrics reported to StatsD are counters or timing data (which are +sent in units of milliseconds). StatsD usually expands timing data out to min, +max, avg, count, and 90th percentile per timing metric, but the details of +this behavior will depend on the configuration of your StatsD server. Some +important "gauge" metrics may still need to be collected using another method. +For example, the `object-server.async_pendings` StatsD metric counts the generation +of async_pendings in real-time, but will not tell you the current number of +async_pending container updates on disk at any point in time. Note also that the set of metrics collected, their names, and their semantics -are not locked down and will change over time. StatsD logging is currently in -a "beta" stage and will continue to evolve. - -Metrics for `account-auditor`: - -========================== ========================================================= -Metric Name Description --------------------------- --------------------------------------------------------- -`account-auditor.errors` Count of audit runs (across all account databases) which - caught an Exception. -`account-auditor.passes` Count of individual account databases which passed audit. -`account-auditor.failures` Count of individual account databases which failed audit. -`account-auditor.timing` Timing data for individual account database audits. 
-========================== ========================================================= - -Metrics for `account-reaper`: - -============================================== ==================================================== -Metric Name Description ----------------------------------------------- ---------------------------------------------------- -`account-reaper.errors` Count of devices failing the mount check. -`account-reaper.timing` Timing data for each reap_account() call. -`account-reaper.return_codes.X` Count of HTTP return codes from various operations - (eg. object listing, container deletion, etc.). The - value for X is the first digit of the return code - (2 for 201, 4 for 404, etc.). -`account-reaper.containers_failures` Count of failures to delete a container. -`account-reaper.containers_deleted` Count of containers successfully deleted. -`account-reaper.containers_remaining` Count of containers which failed to delete with - zero successes. -`account-reaper.containers_possibly_remaining` Count of containers which failed to delete with - at least one success. -`account-reaper.objects_failures` Count of failures to delete an object. -`account-reaper.objects_deleted` Count of objects successfully deleted. -`account-reaper.objects_remaining` Count of objects which failed to delete with zero - successes. -`account-reaper.objects_possibly_remaining` Count of objects which failed to delete with at - least one success. -============================================== ==================================================== - -Metrics for `account-server` ("Not Found" is not considered an error and requests -which increment `errors` are not included in the timing data): - -======================================== ======================================================= -Metric Name Description ----------------------------------------- ------------------------------------------------------- -`account-server.DELETE.errors.timing` Timing data for each DELETE request resulting in an - error: bad request, not mounted, missing timestamp. -`account-server.DELETE.timing` Timing data for each DELETE request not resulting in - an error. -`account-server.PUT.errors.timing` Timing data for each PUT request resulting in an error: - bad request, not mounted, conflict, recently-deleted. -`account-server.PUT.timing` Timing data for each PUT request not resulting in an - error. -`account-server.HEAD.errors.timing` Timing data for each HEAD request resulting in an - error: bad request, not mounted. -`account-server.HEAD.timing` Timing data for each HEAD request not resulting in - an error. -`account-server.GET.errors.timing` Timing data for each GET request resulting in an - error: bad request, not mounted, bad delimiter, - account listing limit too high, bad accept header. -`account-server.GET.timing` Timing data for each GET request not resulting in - an error. -`account-server.REPLICATE.errors.timing` Timing data for each REPLICATE request resulting in an - error: bad request, not mounted. -`account-server.REPLICATE.timing` Timing data for each REPLICATE request not resulting - in an error. -`account-server.POST.errors.timing` Timing data for each POST request resulting in an - error: bad request, bad or missing timestamp, not - mounted. -`account-server.POST.timing` Timing data for each POST request not resulting in - an error. 
-======================================== ======================================================= - -Metrics for `account-replicator`: - -===================================== ==================================================== -Metric Name Description -------------------------------------- ---------------------------------------------------- -`account-replicator.diffs` Count of syncs handled by sending differing rows. -`account-replicator.diff_caps` Count of "diffs" operations which failed because - "max_diffs" was hit. -`account-replicator.no_changes` Count of accounts found to be in sync. -`account-replicator.hashmatches` Count of accounts found to be in sync via hash - comparison (`broker.merge_syncs` was called). -`account-replicator.rsyncs` Count of completely missing accounts which were sent - via rsync. -`account-replicator.remote_merges` Count of syncs handled by sending entire database - via rsync. -`account-replicator.attempts` Count of database replication attempts. -`account-replicator.failures` Count of database replication attempts which failed - due to corruption (quarantined) or inability to read - as well as attempts to individual nodes which - failed. -`account-replicator.removes.` Count of databases on deleted because the - delete_timestamp was greater than the put_timestamp - and the database had no rows or because it was - successfully sync'ed to other locations and doesn't - belong here anymore. -`account-replicator.successes` Count of replication attempts to an individual node - which were successful. -`account-replicator.timing` Timing data for each database replication attempt - not resulting in a failure. -===================================== ==================================================== - -Metrics for `container-auditor`: - -============================ ==================================================== -Metric Name Description ----------------------------- ---------------------------------------------------- -`container-auditor.errors` Incremented when an Exception is caught in an audit - pass (only once per pass, max). -`container-auditor.passes` Count of individual containers passing an audit. -`container-auditor.failures` Count of individual containers failing an audit. -`container-auditor.timing` Timing data for each container audit. -============================ ==================================================== - -Metrics for `container-replicator`: - -======================================= ==================================================== -Metric Name Description ---------------------------------------- ---------------------------------------------------- -`container-replicator.diffs` Count of syncs handled by sending differing rows. -`container-replicator.diff_caps` Count of "diffs" operations which failed because - "max_diffs" was hit. -`container-replicator.no_changes` Count of containers found to be in sync. -`container-replicator.hashmatches` Count of containers found to be in sync via hash - comparison (`broker.merge_syncs` was called). -`container-replicator.rsyncs` Count of completely missing containers where were sent - via rsync. -`container-replicator.remote_merges` Count of syncs handled by sending entire database - via rsync. -`container-replicator.attempts` Count of database replication attempts. -`container-replicator.failures` Count of database replication attempts which failed - due to corruption (quarantined) or inability to read - as well as attempts to individual nodes which - failed. 
-`container-replicator.removes.` Count of databases deleted on because the - delete_timestamp was greater than the put_timestamp - and the database had no rows or because it was - successfully sync'ed to other locations and doesn't - belong here anymore. -`container-replicator.successes` Count of replication attempts to an individual node - which were successful. -`container-replicator.timing` Timing data for each database replication attempt - not resulting in a failure. -======================================= ==================================================== - -Metrics for `container-server` ("Not Found" is not considered an error and requests -which increment `errors` are not included in the timing data): - -========================================== ==================================================== -Metric Name Description ------------------------------------------- ---------------------------------------------------- -`container-server.DELETE.errors.timing` Timing data for DELETE request errors: bad request, - not mounted, missing timestamp, conflict. -`container-server.DELETE.timing` Timing data for each DELETE request not resulting in - an error. -`container-server.PUT.errors.timing` Timing data for PUT request errors: bad request, - missing timestamp, not mounted, conflict. -`container-server.PUT.timing` Timing data for each PUT request not resulting in an - error. -`container-server.HEAD.errors.timing` Timing data for HEAD request errors: bad request, - not mounted. -`container-server.HEAD.timing` Timing data for each HEAD request not resulting in - an error. -`container-server.GET.errors.timing` Timing data for GET request errors: bad request, - not mounted, parameters not utf8, bad accept header. -`container-server.GET.timing` Timing data for each GET request not resulting in - an error. -`container-server.REPLICATE.errors.timing` Timing data for REPLICATE request errors: bad - request, not mounted. -`container-server.REPLICATE.timing` Timing data for each REPLICATE request not resulting - in an error. -`container-server.POST.errors.timing` Timing data for POST request errors: bad request, - bad x-container-sync-to, not mounted. -`container-server.POST.timing` Timing data for each POST request not resulting in - an error. -========================================== ==================================================== - -Metrics for `container-sync`: - -=============================== ==================================================== -Metric Name Description -------------------------------- ---------------------------------------------------- -`container-sync.skips` Count of containers skipped because they don't have - sync'ing enabled. -`container-sync.failures` Count of failures sync'ing of individual containers. -`container-sync.syncs` Count of individual containers sync'ed successfully. -`container-sync.deletes` Count of container database rows sync'ed by - deletion. -`container-sync.deletes.timing` Timing data for each container database row - sychronization via deletion. -`container-sync.puts` Count of container database rows sync'ed by PUTing. -`container-sync.puts.timing` Timing data for each container database row - synchronization via PUTing. 
-=============================== ==================================================== - -Metrics for `container-updater`: - -============================== ==================================================== -Metric Name Description ------------------------------- ---------------------------------------------------- -`container-updater.successes` Count of containers which successfully updated their - account. -`container-updater.failures` Count of containers which failed to update their - account. -`container-updater.no_changes` Count of containers which didn't need to update - their account. -`container-updater.timing` Timing data for processing a container; only - includes timing for containers which needed to - update their accounts (i.e. "successes" and - "failures" but not "no_changes"). -============================== ==================================================== - -Metrics for `object-auditor`: - -============================ ==================================================== -Metric Name Description ----------------------------- ---------------------------------------------------- -`object-auditor.quarantines` Count of objects failing audit and quarantined. -`object-auditor.errors` Count of errors encountered while auditing objects. -`object-auditor.timing` Timing data for each object audit (does not include - any rate-limiting sleep time for - max_files_per_second, but does include rate-limiting - sleep time for max_bytes_per_second). -============================ ==================================================== - -Metrics for `object-expirer`: - -======================== ==================================================== -Metric Name Description ------------------------- ---------------------------------------------------- -`object-expirer.objects` Count of objects expired. -`object-expirer.errors` Count of errors encountered while attempting to - expire an object. -`object-expirer.timing` Timing data for each object expiration attempt, - including ones resulting in an error. -======================== ==================================================== - -Metrics for `object-replicator`: - -=================================================== ==================================================== -Metric Name Description ---------------------------------------------------- ---------------------------------------------------- -`object-replicator.partition.delete.count.` A count of partitions on which were - replicated to another node because they didn't - belong on this node. This metric is tracked - per-device to allow for "quiescence detection" for - object replication activity on each device. -`object-replicator.partition.delete.timing` Timing data for partitions replicated to another - node because they didn't belong on this node. This - metric is not tracked per device. -`object-replicator.partition.update.count.` A count of partitions on which were - replicated to another node, but also belong on this - node. As with delete.count, this metric is tracked - per-device. -`object-replicator.partition.update.timing` Timing data for partitions replicated which also - belong on this node. This metric is not tracked - per-device. -`object-replicator.suffix.hashes` Count of suffix directories whose hash (of filenames) - was recalculated. -`object-replicator.suffix.syncs` Count of suffix directories replicated with rsync. 
-=================================================== ==================================================== - -Metrics for `object-server`: - -======================================= ==================================================== -Metric Name Description ---------------------------------------- ---------------------------------------------------- -`object-server.quarantines` Count of objects (files) found bad and moved to - quarantine. -`object-server.async_pendings` Count of container updates saved as async_pendings - (may result from PUT or DELETE requests). -`object-server.POST.errors.timing` Timing data for POST request errors: bad request, - missing timestamp, delete-at in past, not mounted. -`object-server.POST.timing` Timing data for each POST request not resulting in - an error. -`object-server.PUT.errors.timing` Timing data for PUT request errors: bad request, - not mounted, missing timestamp, object creation - constraint violation, delete-at in past. -`object-server.PUT.timeouts` Count of object PUTs which exceeded max_upload_time. -`object-server.PUT.timing` Timing data for each PUT request not resulting in an - error. -`object-server.GET.errors.timing` Timing data for GET request errors: bad request, - not mounted, header timestamps before the epoch, - precondition failed. - File errors resulting in a quarantine are not - counted here. -`object-server.GET.timing` Timing data for each GET request not resulting in an - error. Includes requests which couldn't find the - object (including disk errors resulting in file - quarantine). -`object-server.HEAD.errors.timing` Timing data for HEAD request errors: bad request, - not mounted. -`object-server.HEAD.timing` Timing data for each HEAD request not resulting in - an error. Includes requests which couldn't find the - object (including disk errors resulting in file - quarantine). -`object-server.DELETE.errors.timing` Timing data for DELETE request errors: bad request, - missing timestamp, not mounted, precondition - failed. Includes requests which couldn't find or - match the object. -`object-server.DELETE.timing` Timing data for each DELETE request not resulting - in an error. -`object-server.REPLICATE.errors.timing` Timing data for REPLICATE request errors: bad - request, not mounted. -`object-server.REPLICATE.timing` Timing data for each REPLICATE request not resulting - in an error. -======================================= ==================================================== - -Metrics for `object-updater`: - -============================ ==================================================== -Metric Name Description ----------------------------- ---------------------------------------------------- -`object-updater.errors` Count of drives not mounted or async_pending files - with an unexpected name. -`object-updater.timing` Timing data for object sweeps to flush async_pending - container updates. Does not include object sweeps - which did not find an existing async_pending storage - directory. -`object-updater.quarantines` Count of async_pending container updates which were - corrupted and moved to quarantine. -`object-updater.successes` Count of successful container updates. -`object-updater.failures` Count of failed container updates. -`object-updater.unlinks` Count of async_pending files unlinked. An - async_pending file is unlinked either when it is - successfully processed or when the replicator sees - that there is a newer async_pending file for the - same object. 
-============================ ==================================================== - -Metrics for `proxy-server` (in the table, `` is the proxy-server -controller responsible for the request and will be one of "account", -"container", or "object"): - -======================================== ==================================================== -Metric Name Description ----------------------------------------- ---------------------------------------------------- -`proxy-server.errors` Count of errors encountered while serving requests - before the controller type is determined. Includes - invalid Content-Length, errors finding the internal - controller to handle the request, invalid utf8, and - bad URLs. -`proxy-server..handoff_count` Count of node hand-offs; only tracked if log_handoffs - is set in the proxy-server config. -`proxy-server..handoff_all_count` Count of times *only* hand-off locations were - utilized; only tracked if log_handoffs is set in the - proxy-server config. -`proxy-server..client_timeouts` Count of client timeouts (client did not read within - `client_timeout` seconds during a GET or did not - supply data within `client_timeout` seconds during - a PUT). -`proxy-server..client_disconnects` Count of detected client disconnects during PUT - operations (does NOT include caught Exceptions in - the proxy-server which caused a client disconnect). -======================================== ==================================================== - -Metrics for `proxy-logging` middleware (in the table, `` is either the -proxy-server controller responsible for the request: "account", "container", -"object", or the string "SOS" if the request came from the `Swift Origin Server`_ -middleware. The `` portion will be one of "GET", "HEAD", "POST", "PUT", -"DELETE", "COPY", "OPTIONS", or "BAD_METHOD". The list of valid HTTP methods -is configurable via the `log_statsd_valid_http_methods` config variable and -the default setting yields the above behavior. - -.. _Swift Origin Server: https://github.com/dpgoetz/sos - -============================================ ==================================================== -Metric Name Description --------------------------------------------- ---------------------------------------------------- -`proxy-server....timing` Timing data for requests. The portion is - the numeric HTTP status code for the request (eg. - "200" or "404") -`proxy-server....xfer` The count of the sum of bytes transferred in (from - clients) and out (to clients) for requests. The - , , and portions of the metric - are just like the timing metric. -============================================ ==================================================== - -Metrics for `tempauth` middleware (in the table, `` represents -the actual configured reseller_prefix or "`NONE`" if the reseller_prefix is the -empty string): - -========================================= ==================================================== -Metric Name Description ------------------------------------------ ---------------------------------------------------- -`tempauth..unauthorized` Count of regular requests which were denied with - HTTPUnauthorized. -`tempauth..forbidden` Count of regular requests which were denied with - HTTPForbidden. -`tempauth..token_denied` Count of token requests which were denied. -`tempauth..errors` Count of errors. -========================================= ==================================================== - +are not locked down and will change over time. 
For more details, see the +service-specific tables listed below: + +.. toctree:: + metrics/account_auditor + metrics/account_reaper + metrics/account_server + metrics/account_replicator + metrics/container_auditor + metrics/container_replicator + metrics/container_server + metrics/container_sync + metrics/container_updater + metrics/object_auditor + metrics/object_expirer + metrics/object_reconstructor + metrics/object_replicator + metrics/object_server + metrics/object_updater + metrics/proxy_server + +Or, view :doc:`metrics/all` as one page. ------------------------ Debugging Tips and Tools @@ -858,6 +925,14 @@ If you are looking at an object on the server and need more info, `swift-object-info` will display the account, container, replica locations and metadata of the object. +If you are looking at a container on the server and need more info, +`swift-container-info` will display all the information like the account, +container, replica locations and metadata of the container. + +If you are looking at an account on the server and need more info, +`swift-account-info` will display the account, replica locations +and metadata of the account. + If you want to audit the data for an account, `swift-account-audit` can be used to crawl the account, checking that all containers and objects can be found. @@ -866,23 +941,41 @@ found. Managing Services ----------------- -Swift services are generally managed with `swift-init`. the general usage is -``swift-init ``, where service is the swift service to +Swift services are generally managed with ``swift-init``. the general usage is +``swift-init ``, where service is the Swift service to manage (for example object, container, account, proxy) and command is one of: -========== =============================================== -Command Description ----------- ----------------------------------------------- -start Start the service -stop Stop the service -restart Restart the service -shutdown Attempt to gracefully shutdown the service -reload Attempt to gracefully restart the service -========== =============================================== - -A graceful shutdown or reload will finish any current requests before -completely stopping the old service. There is also a special case of -`swift-init all `, which will run the command for all swift services. +=============== =============================================== +Command Description +--------------- ----------------------------------------------- +start Start the service +stop Stop the service +restart Restart the service +shutdown Attempt to gracefully shutdown the service +reload Attempt to gracefully restart the service +reload-seamless Attempt to seamlessly restart the service +=============== =============================================== + +A graceful shutdown or reload will allow all server workers to finish any +current requests before exiting. The parent server process exits immediately. + +A seamless reload will make new configuration settings active, with no window +where client requests fail due to there being no active listen socket. +The parent server process will re-exec itself, retaining its existing PID. +After the re-exec'ed parent server process binds its listen sockets, the old +listen sockets are closed and old server workers finish any current requests +before exiting. + +There is also a special case of ``swift-init all ``, which will run +the command for all swift services. 
+ +In cases where there are multiple configs for a service, a specific config +can be managed with ``swift-init . ``. +For example, when a separate replication network is used, there might be +``/etc/swift/object-server/public.conf`` for the object server and +``/etc/swift/object-server/replication.conf`` for the replication services. +In this case, the replication services could be restarted with +``swift-init object-server.replication restart``. -------------- Object Auditor @@ -892,20 +985,31 @@ On system failures, the XFS file system can sometimes truncate files it's trying to write and produce zero-byte files. The object-auditor will catch these problems but in the case of a system crash it would be advisable to run an extra, less rate limited sweep to check for these specific files. You can -run this command as follows: -`swift-object-auditor /path/to/object-server/config/file.conf once -z 1000` -"-z" means to only check for zero-byte files at 1000 files per second. +run this command as follows:: + + swift-object-auditor /path/to/object-server/config/file.conf once -z 1000 + +``-z`` means to only check for zero-byte files at 1000 files per second. + +At times it is useful to be able to run the object auditor on a specific +device or set of devices. You can run the object-auditor as follows:: + + swift-object-auditor /path/to/object-server/config/file.conf once --devices=sda,sdb + +This will run the object auditor on only the sda and sdb devices. This param +accepts a comma separated list of values. ----------------- Object Replicator ----------------- At times it is useful to be able to run the object replicator on a specific -device or partition. You can run the object-replicator as follows: -swift-object-replicator /path/to/object-server/config/file.conf once --devices=sda,sdb +device or partition. You can run the object-replicator as follows:: + + swift-object-replicator /path/to/object-server/config/file.conf once --devices=sda,sdb This will run the object replicator on only the sda and sdb devices. You can -likewise run that command with --partitions. Both params accept a comma +likewise run that command with ``--partitions``. Both params accept a comma separated list of values. If both are specified they will be ANDed together. These can only be run in "once" mode. @@ -915,9 +1019,9 @@ Swift Orphans Swift Orphans are processes left over after a reload of a Swift server. -For example, when upgrading a proxy server you would probaby finish -with a `swift-init proxy-server reload` or `/etc/init.d/swift-proxy -reload`. This kills the parent proxy server process and leaves the +For example, when upgrading a proxy server you would probably finish +with a ``swift-init proxy-server reload`` or ``/etc/init.d/swift-proxy +reload``. This kills the parent proxy server process and leaves the child processes running to finish processing whatever requests they might be handling at the time. It then starts up a new parent proxy server process and its children to handle new incoming requests. This @@ -927,16 +1031,16 @@ The orphaned child processes may take a while to exit, depending on the length of the requests they were handling. However, sometimes an old process can be hung up due to some bug or hardware issue. In these cases, these orphaned processes will hang around -forever. `swift-orphans` can be used to find and kill these orphans. +forever. ``swift-orphans`` can be used to find and kill these orphans. 
-`swift-orphans` with no arguments will just list the orphans it finds +``swift-orphans`` with no arguments will just list the orphans it finds that were started more than 24 hours ago. You shouldn't really check for orphans until 24 hours after you perform a reload, as some -requests can take a long time to process. `swift-orphans -k TERM` will -send the SIG_TERM signal to the orphans processes, or you can `kill --TERM` the pids yourself if you prefer. +requests can take a long time to process. ``swift-orphans -k TERM`` will +send the SIG_TERM signal to the orphans processes, or you can ``kill +-TERM`` the pids yourself if you prefer. -You can run `swift-orphans --help` for more options. +You can run ``swift-orphans --help`` for more options. ------------ @@ -947,11 +1051,11 @@ Swift Oldies are processes that have just been around for a long time. There's nothing necessarily wrong with this, but it might indicate a hung process if you regularly upgrade and reload/restart services. You might have so many servers that you don't notice when a -reload/restart fails; `swift-oldies` can help with this. +reload/restart fails; ``swift-oldies`` can help with this. For example, if you upgraded and reloaded/restarted everything 2 days -ago, and you've already cleaned up any orphans with `swift-orphans`, -you can run `swift-oldies -a 48` to find any Swift processes still +ago, and you've already cleaned up any orphans with ``swift-orphans``, +you can run ``swift-oldies -a 48`` to find any Swift processes still around that were started more than 2 days ago and then investigate them accordingly. @@ -963,9 +1067,9 @@ Custom Log Handlers Swift supports setting up custom log handlers for services by specifying a comma-separated list of functions to invoke when logging is setup. It does so -via the `log_custom_handlers` configuration option. Logger hooks invoked are -passed the same arguments as Swift's get_logger function (as well as the -getLogger and LogAdapter object): +via the ``log_custom_handlers`` configuration option. Logger hooks invoked are +passed the same arguments as Swift's ``get_logger`` function, as well as the +``logging.Logger`` and ``SwiftLogAdapter`` objects: ============== =============================================== Name Description @@ -979,6 +1083,14 @@ logger The logging.getLogger object adapted_logger The LogAdapter object ============== =============================================== +.. note:: + The instance of ``SwiftLogAdapter`` that wraps the ``logging.Logger`` + object may be replaced with cloned instances during runtime, for example to + use a different log prefix with the same ``logging.Logger``. Custom log + handlers should therefore not modify any attributes of the + ``SwiftLogAdapter`` instance other than those that will be copied if it is + cloned. + A basic example that sets up a custom logger might look like the following: @@ -993,3 +1105,10 @@ following: See :ref:`custom-logger-hooks-label` for sample use cases. +------------------------ +Securing OpenStack Swift +------------------------ + +Please refer to the security guide at https://docs.openstack.org/security-guide +and in particular the `Object Storage +`__ section. 
diff --git a/doc/source/apache_deployment_guide.rst b/doc/source/apache_deployment_guide.rst new file mode 100644 index 0000000000..e0b3ed4924 --- /dev/null +++ b/doc/source/apache_deployment_guide.rst @@ -0,0 +1,193 @@ +======================= +Apache Deployment Guide +======================= + +---------------------------- +Web Front End Considerations +---------------------------- + +Swift can be configured to work both using an integral web front-end and using a +full-fledged Web Server such as the Apache2 (HTTPD) web server. The integral +web front-end is a wsgi mini "Web Server" which opens up its own socket and +serves http requests directly. The incoming requests accepted by the integral +web front-end are then forwarded to a wsgi application (the core swift) for +further handling, possibly via wsgi middleware sub-components. + +client<---->'integral web front-end'<---->middleware<---->'core swift' + +To gain full advantage of Apache2, Swift can alternatively be configured to work +as a request processor of the Apache2 server. This alternative deployment +scenario uses mod_wsgi of Apache2 to forward requests to the swift wsgi +application and middleware. + +client<---->'Apache2 with mod_wsgi'<----->middleware<---->'core swift' + +The integral web front-end offers simplicity and requires minimal configuration. +It is also the web front-end most commonly used with Swift. Additionally, the +integral web front-end includes support for receiving chunked transfer encoding +from a client, presently not supported by Apache2 in the operation mode +described here. + +The use of Apache2 offers new ways to extend Swift and integrate it with +existing authentication, administration and control systems. A single Apache2 +server can serve as the web front end of any number of swift servers residing on +a swift node. For example when a storage node offers account, container and +object services, a single Apache2 server can serve as the web front end of all +three services. + +The apache variant described here was tested as part of an IBM research work. +It was found that following tuning, the Apache2 offer generally equivalent +performance to that offered by the integral web front-end. Alternative to +Apache2, other web servers may be used, but were never tested. + +------------- +Apache2 Setup +------------- +Both Apache2 and mod-wsgi needs to be installed on the system. Ubuntu comes +with Apache2 installed. Install mod-wsgi using:: + + sudo apt-get install libapache2-mod-wsgi + +Create a directory for the Apache2 wsgi files:: + + sudo mkdir /srv/www/swift + +Create a working directory for the wsgi processes:: + + sudo mkdir -m 2770 /var/lib/swift + sudo chown swift:swift /var/lib/swift + +Create a file for each service under ``/srv/www/swift``. 
+ +For a proxy service create ``/srv/www/swift/proxy-server.wsgi``:: + + from swift.common.wsgi import init_request_processor + application, conf, logger, log_name = \ + init_request_processor('/etc/swift/proxy-server.conf','proxy-server') + +For an account service create ``/srv/www/swift/account-server.wsgi``:: + + from swift.common.wsgi import init_request_processor + application, conf, logger, log_name = \ + init_request_processor('/etc/swift/account-server.conf', + 'account-server') + +For an container service create ``/srv/www/swift/container-server.wsgi``:: + + from swift.common.wsgi import init_request_processor + application, conf, logger, log_name = \ + init_request_processor('/etc/swift/container-server.conf', + 'container-server') + +For an object service create ``/srv/www/swift/object-server.wsgi``:: + + from swift.common.wsgi import init_request_processor + application, conf, logger, log_name = \ + init_request_processor('/etc/swift/object-server.conf', + 'object-server') + +Create a ``/etc/apache2/conf.d/swift_wsgi.conf`` configuration file that will +define a port and Virtual Host per each local service. For example an Apache2 +serving as a web front end of a proxy service:: + + # Proxy + Listen 8080 + + + ServerName proxy-server + + LimitRequestBody 5368709122 + LimitRequestFields 200 + + WSGIDaemonProcess proxy-server processes=5 threads=1 user=swift group=swift display-name=%{GROUP} + WSGIProcessGroup proxy-server + WSGIScriptAlias / /srv/www/swift/proxy-server.wsgi + LogLevel debug + CustomLog /var/log/apache2/proxy.log combined + ErrorLog /var/log/apache2/proxy-server + + +Notice that when using Apache the limit on the maximal object size should be +imposed by Apache using the `LimitRequestBody` rather by the swift proxy. Note +also that the `LimitRequestBody` should indicate the same value as indicated by +`max_file_size` located in both ``/etc/swift/swift.conf`` and in +``/etc/swift/test.conf``. The Swift default value for `max_file_size` (when not +present) is `5368709122`. 
For example an Apache2 serving as a web front end of a +storage node:: + + # Object Service + Listen 6200 + + + ServerName object-server + + LimitRequestFields 200 + + WSGIDaemonProcess object-server processes=5 threads=1 user=swift group=swift display-name=%{GROUP} + WSGIProcessGroup object-server + WSGIScriptAlias / /srv/www/swift/object-server.wsgi + LogLevel debug + CustomLog /var/log/apache2/access.log combined + ErrorLog /var/log/apache2/object-server + + + # Container Service + Listen 6201 + + + ServerName container-server + + LimitRequestFields 200 + + WSGIDaemonProcess container-server processes=5 threads=1 user=swift group=swift display-name=%{GROUP} + WSGIProcessGroup container-server + WSGIScriptAlias / /srv/www/swift/container-server.wsgi + LogLevel debug + CustomLog /var/log/apache2/access.log combined + ErrorLog /var/log/apache2/container-server + + + # Account Service + Listen 6202 + + + ServerName account-server + + LimitRequestFields 200 + + WSGIDaemonProcess account-server processes=5 threads=1 user=swift group=swift display-name=%{GROUP} + WSGIProcessGroup account-server + WSGIScriptAlias / /srv/www/swift/account-server.wsgi + LogLevel debug + CustomLog /var/log/apache2/access.log combined + ErrorLog /var/log/apache2/account-server + + +Enable the newly configured Virtual Hosts:: + + a2ensite swift_wsgi.conf + +Next, stop, test and start Apache2 again:: + + # stop it + systemctl stop apache2.service + + # test the configuration + apache2ctl -t + + # start it if the test succeeds + systemctl start apache2.service + + +Edit the tests config file and add:: + + web_front_end = apache2 + normalized_urls = True + +Also check to see that the file includes `max_file_size` of the same value as +used for the `LimitRequestBody` in the apache config file above. + +We are done. You may run functional tests to test - e.g.:: + + cd ~swift/swift + ./.functests diff --git a/doc/source/api/authentication.rst b/doc/source/api/authentication.rst new file mode 100644 index 0000000000..3d1044e7c3 --- /dev/null +++ b/doc/source/api/authentication.rst @@ -0,0 +1,58 @@ +============== +Authentication +============== + +The owner of an Object Storage account controls access to that account +and its containers and objects. An owner is the user who has the +''admin'' role for that tenant. The tenant is also known as the project +or account. As the account owner, you can modify account metadata and +create, modify, and delete containers and objects. + +To identify yourself as the account owner, include an authentication +token in the ''X-Auth-Token'' header in the API request. + +Depending on the token value in the ''X-Auth-Token'' header, one of the +following actions occur: + +- ''X-Auth-Token'' contains the token for the account owner. + + The request is permitted and has full access to make changes to the + account. + +- The ''X-Auth-Token'' header is omitted or it contains a token for a + non-owner or a token that is not valid. + + The request fails with a 401 Unauthorized or 403 Forbidden response. + + You have no access to accounts or containers, unless an access + control list (ACL) explicitly grants access. + + The account owner can grant account and container access to users + through access control lists (ACLs). + +In addition, it is possible to provide an additional token in the +''X-Service-Token'' header. More information about how this is used is in +:doc:`../overview_backing_store`. 
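+
+As an illustration, the following minimal sketch sends an authenticated
+request using Python's standard library. The storage URL and token value
+are placeholders; in practice you obtain both from your authentication
+service:
+
+.. code-block:: python
+
+    import urllib.request
+
+    # Placeholder values returned by your authentication service.
+    storage_url = 'https://storage.example.com/v1/AUTH_12345678912345'
+    token = 'AUTH_tk1234567890abcdef'
+
+    # List the containers in the account; the token identifies the caller.
+    req = urllib.request.Request(
+        storage_url + '?format=json',
+        headers={'X-Auth-Token': token})
+    with urllib.request.urlopen(req) as resp:
+        print(resp.read().decode('utf-8'))
+
+If the token is omitted, expired, or belongs to a non-owner who has not been
+granted access through an ACL, the same request fails with a 401
+Unauthorized or 403 Forbidden response, as described above.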
+ +The following list describes the authentication services that you can +use with Object Storage: + +- OpenStack Identity (keystone): For Object Storage, account is synonymous with + project or tenant ID. + +- Tempauth middleware: Object Storage includes this middleware. User and account + management is performed in Object Storage itself. + +- Swauth middleware: Stored in github, this custom middleware is modeled on + Tempauth. Usage is similar to Tempauth. + +- Other custom middleware: Write it yourself to fit your environment. + +Specifically, you use the ''X-Auth-Token'' header to pass an +authentication token to an API request. + +Authentication tokens expire after a time period that the authentication +service defines. When a token expires, use of the token causes requests +to fail with a 401 Unauthorized response. To continue, you must obtain a +new token. + diff --git a/doc/source/api/bulk-delete.rst b/doc/source/api/bulk-delete.rst new file mode 100644 index 0000000000..367eed3aa8 --- /dev/null +++ b/doc/source/api/bulk-delete.rst @@ -0,0 +1,93 @@ +.. _bulk-delete: + +=========== +Bulk delete +=========== + +To discover whether your Object Storage system supports this feature, +see :ref:`discoverability`. Alternatively, check with your service provider. + +With bulk delete, you can delete up to 10,000 objects or containers +(configurable) in one request. + +Bulk delete request +~~~~~~~~~~~~~~~~~~~ + +To perform a bulk delete operation, add the ``bulk-delete`` query +parameter to the path of a ``POST`` or ``DELETE`` operation. + +.. note:: + + The ``DELETE`` operation is supported for backwards compatibility. + +The path is the account, such as ``/v1/12345678912345``, that contains +the objects and containers. + +In the request body of the ``POST`` or ``DELETE`` operation, list the +objects or containers to be deleted. Separate each name with a newline +character. You can include a maximum of 10,000 items (configurable) in +the list. + +In addition, you must: + +- UTF-8-encode and then URL-encode the names. + +- To indicate an object, specify the container and object name as: + ``CONTAINER_NAME``/``OBJECT_NAME``. + +- To indicate a container, specify the container name as: + ``CONTAINER_NAME``. Make sure that the container is empty. If it + contains objects, Object Storage cannot delete the container. + +- Set the ``Content-Type`` request header to ``text/plain``. + +Bulk delete response +~~~~~~~~~~~~~~~~~~~~ + +When Object Storage processes the request, it performs multiple +sub-operations. Even if all sub-operations fail, the operation returns a +200 status. The bulk operation returns a response body that contains +details that indicate which sub-operations have succeeded and failed. +Some sub-operations might succeed while others fail. Examine the +response body to determine the results of each delete sub-operation. + +You can set the ``Accept`` request header to one of the following values +to define the response format: + +``text/plain`` + Formats response as plain text. If you omit the + ``Accept`` header, ``text/plain`` is the default. + +``application/json`` + Formats response as JSON. + +``application/xml`` or ``text/xml`` + Formats response as XML. + +The response body contains the following information: + +- The number of files actually deleted. + +- The number of not found objects. + +- Errors. A list of object names and associated error statuses for the + objects that failed to delete. The format depends on the value that + you set in the ``Accept`` header. 
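+
+Before looking at an example response, the following minimal sketch shows
+how such a request could be issued with Python's standard library. The
+storage URL, token, and the container and object names are placeholders:
+
+.. code-block:: python
+
+    import urllib.parse
+    import urllib.request
+
+    # Placeholder account URL and token.
+    storage_url = 'https://storage.example.com/v1/12345678912345'
+    token = 'AUTH_tk1234567890abcdef'
+
+    # Objects are given as CONTAINER_NAME/OBJECT_NAME, empty containers
+    # as CONTAINER_NAME. Each name is UTF-8 encoded, URL-encoded, and
+    # separated by a newline character.
+    items = ['photos/cat.jpg', 'photos/dog.jpg', 'mycontainer']
+    body = '\n'.join(
+        urllib.parse.quote(name.encode('utf-8')) for name in items)
+
+    req = urllib.request.Request(
+        storage_url + '?bulk-delete',
+        data=body.encode('ascii'),
+        method='POST',
+        headers={'X-Auth-Token': token,
+                 'Content-Type': 'text/plain',
+                 'Accept': 'application/json'})
+    with urllib.request.urlopen(req) as resp:
+        # Even if sub-operations fail, the operation returns 200; inspect
+        # the body for per-item results.
+        print(resp.read().decode('utf-8'))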
+ +The following bulk delete response is in ``application/xml`` format. In +this example, the ``mycontainer`` container is not empty, so it cannot +be deleted. + +.. code-block:: xml + + + 2 + 4 + + + /v1/12345678912345/mycontainer + 409 Conflict + + + + diff --git a/doc/source/api/container_quotas.rst b/doc/source/api/container_quotas.rst new file mode 100644 index 0000000000..9c58eef274 --- /dev/null +++ b/doc/source/api/container_quotas.rst @@ -0,0 +1,32 @@ +.. _container_quotas: + +================ +Container quotas +================ + +You can set quotas on the size and number of objects stored in a +container by setting the following metadata: + +- ``X-Container-Meta-Quota-Bytes``. The size, in bytes, of objects that + can be stored in a container. + +- ``X-Container-Meta-Quota-Count``. The number of objects that can be + stored in a container. + +When you exceed a container quota, subsequent requests to create objects +fail with a 413 Request Entity Too Large error. + +The Object Storage system uses an eventual consistency model. When you +create a new object, the container size and object count might not be +immediately updated. Consequently, you might be allowed to create +objects even though you have actually exceeded the quota. + +At some later time, the system updates the container size and object +count to the actual values. At this time, subsequent requests fails. In +addition, if you are currently under the +``X-Container-Meta-Quota-Bytes`` limit and a request uses chunked +transfer encoding, the system cannot know if the request will exceed the +quota so the system allows the request. However, once the quota is +exceeded, any subsequent uploads that use chunked transfer encoding +fail. + diff --git a/doc/source/api/discoverability.rst b/doc/source/api/discoverability.rst new file mode 100644 index 0000000000..c086d16f7f --- /dev/null +++ b/doc/source/api/discoverability.rst @@ -0,0 +1,37 @@ +=============== +Discoverability +=============== + +Your Object Storage system might not enable all features that you read about because your service provider chooses which features to enable. + +To discover which features are enabled in your Object Storage system, +use the ``/info`` request. However, your service provider might have +disabled the ``/info`` request, or you might be using an older version +that does not support the ``/info`` request. + +To use the ``/info`` request, send a **GET** request using the ``/info`` +path to the Object Store endpoint as shown in this example: + +.. code:: console + + # curl https://storage.clouddrive.com/info + +This example shows a truncated response body: + +.. code:: console + + { + "swift":{ + "version":"1.11.0" + }, + "staticweb":{ + + }, + "tempurl":{ + + } + } + +This output shows that the Object Storage system has enabled the static +website and temporary URL features. + diff --git a/doc/source/api/form_post_middleware.rst b/doc/source/api/form_post_middleware.rst new file mode 100644 index 0000000000..97921d41e8 --- /dev/null +++ b/doc/source/api/form_post_middleware.rst @@ -0,0 +1,211 @@ +==================== +Form POST middleware +==================== + +To discover whether your Object Storage system supports this feature, +check with your service provider or send a **GET** request using the :file:`/info` +path. + +You can upload objects directly to the Object Storage system from a +browser by using the form **POST** middleware. 
This middleware uses +account or container secret keys to generate a cryptographic signature for the +request. This means that you do not need to send an authentication token +in the ``X-Auth-Token`` header to perform the request. + +The form **POST** middleware uses the same secret keys as the temporary +URL middleware uses. For information about how to set these keys, see +:ref:`secret_keys`. + +For information about the form **POST** middleware configuration +options, see :ref:`formpost` in the *Source Documentation*. + +Form POST format +~~~~~~~~~~~~~~~~ + +To upload objects to a cluster, you can use an HTML form **POST** +request. + +The format of the form **POST** request is: + +**Example 1.14. Form POST format** + +.. code:: xml + +
    <form action="SWIFT_URL"
          method="POST"
          enctype="multipart/form-data">
      <input type="hidden" name="redirect" value="REDIRECT_URL"/>
      <input type="hidden" name="max_file_size" value="BYTES"/>
      <input type="hidden" name="max_file_count" value="COUNT"/>
      <input type="hidden" name="expires" value="UNIX_TIMESTAMP"/>
      <input type="hidden" name="signature" value="HMAC"/>
      <input type="file" name="FILE_NAME"/>
      <br/>
      <input type="submit"/>
    </form>
+ + +**action="SWIFT_URL"** + +Set to full URL where the objects are to be uploaded. The names of +uploaded files are appended to the specified *SWIFT_URL*. So, you +can upload directly to the root of a container with a URL like: + +.. code:: none + + https://swift-cluster.example.com/v1/my_account/container/ + +Optionally, you can include an object prefix to separate uploads, such +as: + +.. code:: none + + https://swift-cluster.example.com/v1/my_account/container/OBJECT_PREFIX + + +**method="POST"** + +Must be ``POST``. + + +**enctype="multipart/form-data"** + +Must be ``multipart/form-data``. + + +**name="redirect" value="REDIRECT_URL"** + +Redirects the browser to the *REDIRECT_URL* after the upload +completes. The URL has status and message query parameters added to it, +which specify the HTTP status code for the upload and an optional error +message. The 2\ *nn* status code indicates success. + +The *REDIRECT_URL* can be an empty string. If so, the ``Location`` +response header is not set. + +**name="max\_file\_size" value="BYTES"** + +Required. Indicates the size, in bytes, of the maximum single file +upload. + +**name="max\_file\_count" value= "COUNT"** + +Required. Indicates the maximum number of files that can be uploaded +with the form. + + +**name="expires" value="UNIX_TIMESTAMP"** + +The UNIX timestamp that specifies the time before which the form must be +submitted before it becomes no longer valid. + + +**name="signature" value="HMAC"** + +The HMAC-SHA1 signature of the form. + + +**type="file" name="FILE_NAME"** + +File name of the file to be uploaded. You can include from one to the +``max_file_count`` value of files. + +The file attributes must appear after the other attributes to be +processed correctly. + +If attributes appear after the file attributes, they are not sent with +the sub-request because all attributes in the file cannot be parsed on +the server side unless the whole file is read into memory; the server +does not have enough memory to service these requests. Attributes that +follow the file attributes are ignored. + +Optionally, if you want the uploaded files to be temporary you can set x-delete-at or x-delete-after attributes by adding one of these as a form input: + +.. code:: xml + + + + + +**type= "submit"** + +Must be ``submit``. + +HMAC-SHA1 signature for form POST +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +Form **POST** middleware uses an HMAC-SHA1 cryptographic signature. This +signature includes these elements from the form: + +- The path. Starting with ``/v1/`` onwards and including a container + name and, optionally, an object prefix. In `Example 1.15`, "HMAC-SHA1 + signature for form + POST" the path is + ``/v1/my_account/container/object_prefix``. Do not URL-encode the + path at this stage. + +- A redirect URL. If there is no redirect URL, use the empty string. + +- Maximum file size. In `Example 1.15`, "HMAC-SHA1 signature for form + POST" the + ``max_file_size`` is ``104857600`` bytes. + +- The maximum number of objects to upload. In `Example 1.15`, "HMAC-SHA1 + signature for form + POST" ``max_file_count`` is ``10``. + +- Expiry time. In `Example 1.15, "HMAC-SHA1 signature for form + POST" the expiry time + is set to ``600`` seconds into the future. + +- The secret key. Set as the ``X-Account-Meta-Temp-URL-Key`` header + value for accounts or ``X-Container-Meta-Temp-URL-Key`` header + value for containers. See :ref:`secret_keys` for more information. 
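Note that the signature calculation in Example 1.15 below is written in Python 2 style;
under Python 3, ``hmac.new()`` requires the key and message to be ``bytes``. A hedged
Python 3 variant of the same calculation (placeholder path, redirect URL, and key) is:

.. code:: python

    import hmac
    from hashlib import sha1
    from time import time

    path = '/v1/my_account/container/object_prefix'
    redirect = 'https://myserver.com/some-page'
    max_file_size = 104857600
    max_file_count = 10
    expires = int(time() + 600)
    key = b'MYKEY'

    hmac_body = '%s\n%s\n%s\n%s\n%s' % (
        path, redirect, max_file_size, max_file_count, expires)
    signature = hmac.new(key, hmac_body.encode('utf-8'), sha1).hexdigest()
    print(expires, signature)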
+ +The following example code generates a signature for use with form +**POST**: + +**Example 1.15. HMAC-SHA1 signature for form POST** + +.. code:: python + + import hmac + from hashlib import sha1 + from time import time + path = '/v1/my_account/container/object_prefix' + redirect = 'https://myserver.com/some-page' + max_file_size = 104857600 + max_file_count = 10 + expires = int(time() + 600) + key = 'MYKEY' + hmac_body = '%s\n%s\n%s\n%s\n%s' % (path, redirect, + max_file_size, max_file_count, expires) + signature = hmac.new(key, hmac_body, sha1).hexdigest() + + +For more information, see `RFC 2104: HMAC: Keyed-Hashing for Message +Authentication `__. + +Form POST example +~~~~~~~~~~~~~~~~~ + +The following example shows how to submit a form by using a cURL +command. In this example, the object prefix is ``photos/`` and the file +being uploaded is called ``flower.jpg``. + +This example uses the **swift-form-signature** script to compute the +``expires`` and ``signature`` values. + +.. code:: console + + $ bin/swift-form-signature /v1/my_account/container/photos/ https://example.com/done.html 5373952000 1 200 MYKEY + Expires: 1390825338 + Signature: 35129416ebda2f1a21b3c2b8939850dfc63d8f43 + +.. code:: console + + $ curl -i https://swift-cluster.example.com/v1/my_account/container/photos/ -X POST \ + -F max_file_size=5373952000 -F max_file_count=1 -F expires=1390825338 \ + -F signature=35129416ebda2f1a21b3c2b8939850dfc63d8f43 \ + -F redirect=https://example.com/done.html \ + -F file=@flower.jpg diff --git a/doc/source/api/large_objects.rst b/doc/source/api/large_objects.rst new file mode 100644 index 0000000000..f05f72ebd9 --- /dev/null +++ b/doc/source/api/large_objects.rst @@ -0,0 +1,347 @@ +============= +Large objects +============= + +By default, the content of an object cannot be greater than 5 GB. +However, you can use a number of smaller objects to construct a large +object. The large object is comprised of two types of objects: + +- **Segment objects** store the object content. You can divide your + content into segments, and upload each segment into its own segment + object. Segment objects do not have any special features. You create, + update, download, and delete segment objects just as you would normal + objects. + +- A **manifest object** links the segment objects into one logical + large object. When you download a manifest object, Object Storage + concatenates and returns the contents of the segment objects in the + response body of the request. This behavior extends to the response + headers returned by **GET** and **HEAD** requests. The + ``Content-Length`` response header value is the total size of all + segment objects. Object Storage calculates the ``ETag`` response + header value by taking the ``ETag`` value of each segment, + concatenating them together, and returning the MD5 checksum of the + result. The manifest object types are: + + **Static large objects** + The manifest object content is an ordered list of the names of + the segment objects in JSON format. + + **Dynamic large objects** + The manifest object has a ``X-Object-Manifest`` metadata header. + The value of this header is ``{container}/{prefix}``, + where ``{container}`` is the name of the container where the + segment objects are stored, and ``{prefix}`` is a string that all + segment objects have in common. The manifest object should have + no content. However, this is not enforced. 
+ +Note +~~~~ + +If you make a **COPY** request by using a manifest object as the source, +the new object is a normal, and not a segment, object. If the total size +of the source segment objects exceeds 5 GB, the **COPY** request fails. +However, you can make a duplicate of the manifest object and this new +object can be larger than 5 GB. + +Static large objects +~~~~~~~~~~~~~~~~~~~~ + +To create a static large object, divide your content into pieces and +create (upload) a segment object to contain each piece. + +Create a manifest object. Include the ``multipart-manifest=put`` +query parameter at the end of the manifest object name to indicate that +this is a manifest object. + +The body of the **PUT** request on the manifest object comprises a json +list, where each element is an object representing a segment. These objects +may contain the following attributes: + +- ``path`` (required). The container and object name in the format: + ``{container-name}/{object-name}`` + +- ``etag`` (optional). If provided, this value must match the ``ETag`` + of the segment object. This was included in the response headers when + the segment was created. Generally, this will be the MD5 sum of the + segment. + +- ``size_bytes`` (optional). The size of the segment object. If provided, + this value must match the ``Content-Length`` of that object. + +- ``range`` (optional). The subset of the referenced object that should + be used for segment data. This behaves similar to the ``Range`` header. + If omitted, the entire object will be used. + +Providing the optional ``etag`` and ``size_bytes`` attributes for each +segment ensures that the upload cannot corrupt your data. + +**Example Static large object manifest list** + +This example shows three segment objects. You can use several containers +and the object names do not have to conform to a specific pattern, in +contrast to dynamic large objects. + +.. code:: json + + [ + { + "path": "mycontainer/objseg1", + "etag": "0228c7926b8b642dfb29554cd1f00963", + "size_bytes": 1468006 + }, + { + "path": "mycontainer/pseudodir/seg-obj2", + "etag": "5bfc9ea51a00b790717eeb934fb77b9b", + "size_bytes": 1572864 + }, + { + "path": "other-container/seg-final", + "etag": "b9c3da507d2557c1ddc51f27c54bae51", + "size_bytes": 256 + } + ] + +| + +The ``Content-Length`` request header must contain the length of the +json content—not the length of the segment objects. However, after the +**PUT** operation completes, the ``Content-Length`` metadata is set to +the total length of all the object segments. When using the ``ETag`` +request header in a **PUT** operation, it must contain the MD5 checksum +of the concatenated ``ETag`` values of the object segments. You can also +set the ``Content-Type`` request header and custom object metadata. + +When the **PUT** operation sees the ``multipart-manifest=put`` query +parameter, it reads the request body and verifies that each segment +object exists and that the sizes and ETags match. If there is a +mismatch, the **PUT** operation fails. + +This verification process can take a long time to complete, particularly +as the number of segments increases. You may include a ``heartbeat=on`` +query parameter to have the server: + +1. send a ``202 Accepted`` response before it begins validating segments, +2. periodically send whitespace characters to keep the connection alive, and +3. send a final response code in the body. + +.. 
note:: + The server may still immediately respond with ``400 Bad Request`` + if it can determine that the request is invalid before making + backend requests. + +If everything matches, the manifest object is created. The +``X-Static-Large-Object`` metadata is set to ``true`` indicating that +this is a static object manifest. + +Normally when you perform a **GET** operation on the manifest object, +the response body contains the concatenated content of the segment +objects. To download the manifest list, use the +``multipart-manifest=get`` query parameter. The resulting list is not +formatted the same as the manifest you originally used in the **PUT** +operation. + +If you use the **DELETE** operation on a manifest object, the manifest +object is deleted. The segment objects are not affected. However, if you +add the ``multipart-manifest=delete`` query parameter, the segment +objects are deleted and if all are successfully deleted, the manifest +object is also deleted. + +To change the manifest, use a **PUT** operation with the +``multipart-manifest=put`` query parameter. This request creates a +manifest object. You can also update the object metadata in the usual +way. + +Dynamic large objects +~~~~~~~~~~~~~~~~~~~~~ + +You must segment objects that are larger than 5 GB before you can upload +them. You then upload the segment objects like you would any other +object and create a dynamic large manifest object. The manifest object +tells Object Storage how to find the segment objects that comprise the +large object. The segments remain individually addressable, but +retrieving the manifest object streams all the segments concatenated. +There is no limit to the number of segments that can be a part of a +single large object, but ``Content-Length`` is included in **GET** or **HEAD** +response only if the number of segments is smaller than container listing +limit. In other words, the number of segments that fit within a single +container listing page. + +To ensure the download works correctly, you must upload all the object +segments to the same container and ensure that each object name is +prefixed in such a way that it sorts in the order in which it should be +concatenated. You also create and upload a manifest file. The manifest +file is a zero-byte file with the extra ``X-Object-Manifest`` +``{container}/{prefix}`` header, where ``{container}`` is the container +the object segments are in and ``{prefix}`` is the common prefix for all +the segments. You must UTF-8-encode and then URL-encode the container +and common prefix in the ``X-Object-Manifest`` header. + +It is best to upload all the segments first and then create or update +the manifest. With this method, the full object is not available for +downloading until the upload is complete. Also, you can upload a new set +of segments to a second location and update the manifest to point to +this new location. During the upload of the new segments, the original +manifest is still available to download the first set of segments. + +.. note:: + + When updating a manifest object using a POST request, a + ``X-Object-Manifest`` header must be included for the + object to continue to behave as a manifest object. + +**Example Upload segment of large object request: HTTP** + +.. 
code:: none + + PUT /{api_version}/{account}/{container}/{object} HTTP/1.1 + Host: storage.clouddrive.com + X-Auth-Token: eaaafd18-0fed-4b3a-81b4-663c99ec1cbb + ETag: 8a964ee2a5e88be344f36c22562a6486 + Content-Length: 1 + X-Object-Meta-PIN: 1234 + + +No response body is returned. A status code of 2\ *``nn``* (between 200 +and 299, inclusive) indicates a successful write; status 411 Length +Required denotes a missing ``Content-Length`` or ``Content-Type`` header +in the request. If the MD5 checksum of the data written to the storage +system does NOT match the (optionally) supplied ETag value, a 422 +Unprocessable Entity response is returned. + +You can continue uploading segments like this example shows, prior to +uploading the manifest. + +**Example Upload next segment of large object request: HTTP** + +.. code:: none + + PUT /{api_version}/{account}/{container}/{object} HTTP/1.1 + Host: storage.clouddrive.com + X-Auth-Token: eaaafd18-0fed-4b3a-81b4-663c99ec1cbb + ETag: 8a964ee2a5e88be344f36c22562a6486 + Content-Length: 1 + X-Object-Meta-PIN: 1234 + + +Next, upload the manifest you created that indicates the container the +object segments reside within. Note that uploading additional segments +after the manifest is created causes the concatenated object to be that +much larger but you do not need to recreate the manifest file for +subsequent additional segments. + +**Example Upload manifest request: HTTP** + +.. code:: none + + PUT /{api_version}/{account}/{container}/{object} HTTP/1.1 + Host: storage.clouddrive.com + X-Auth-Token: eaaafd18-0fed-4b3a-81b4-663c99ec1cbb + Content-Length: 0 + X-Object-Meta-PIN: 1234 + X-Object-Manifest: {container}/{prefix} + + +**Example Upload manifest response: HTTP** + +.. code:: none + + [...] + + +The ``Content-Type`` in the response for a **GET** or **HEAD** on the +manifest is the same as the ``Content-Type`` set during the **PUT** +request that created the manifest. You can easily change the +``Content-Type`` by reissuing the **PUT** request. + +Comparison of static and dynamic large objects +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +While static and dynamic objects have similar behavior, here are +their differences: + +End-to-end integrity +-------------------- + +With static large objects, integrity can be assured. +The list of segments may include the MD5 checksum (``ETag``) of each segment. +You cannot upload the manifest object if the ``ETag`` in the list differs +from the uploaded segment object. If a segment is somehow lost, an attempt +to download the manifest object results in an error. + +With dynamic large objects, integrity is not guaranteed. The eventual +consistency model means that although you have uploaded a segment object, it +might not appear in the container listing until later. If you download the +manifest before it appears in the container, it does not form part of the +content returned in response to a **GET** request. + +Upload Order +------------ + +With static large objects, you must upload the +segment objects before you upload the manifest object. + +With dynamic large objects, you can upload manifest and segment objects +in any order. In case a premature download of the manifest occurs, we +recommend users upload the manifest object after the segments. However, +the system does not enforce the order. + +Removal or addition of segment objects +-------------------------------------- + +With static large objects, you cannot add or +remove segment objects from the manifest. 
However, you can create a +completely new manifest object of the same name with a different manifest +list. + +With dynamic large objects, you can upload new segment objects or remove +existing segments. The names must simply match the ``{prefix}`` supplied +in ``X-Object-Manifest``. + +Segment object size and number +------------------------------ + +With static large objects, the segment objects must be at least 1 byte in size. +However, if the segment objects are less than 1MB (by default), +the SLO download is (by default) rate limited. At most, +1000 segments are supported (by default) and the manifest has a limit +(by default) of 2MB in size. + +With dynamic large objects, segment objects can be any size. + +Segment object container name +----------------------------- + +With static large objects, the manifest list includes the container name of each object. +Segment objects can be in different containers. + +With dynamic large objects, all segment objects must be in the same container. + +Manifest object metadata +------------------------ + +With static large objects, the manifest object has ``X-Static-Large-Object`` +set to ``true``. You do not set this +metadata directly. Instead the system sets it when you **PUT** a static +manifest object. + +With dynamic large objects, the ``X-Object-Manifest`` value is the +``{container}/{prefix}``, which indicates +where the segment objects are located. You supply this request header in the +**PUT** operation. + +Copying the manifest object +--------------------------- + +The semantics are the same for both static and dynamic large objects. +When copying large objects, the **COPY** operation does not create +a manifest object but a normal object with content same as what you would +get on a **GET** request to the original manifest object. + +To copy the manifest object, you include the ``multipart-manifest=get`` +query parameter in the **COPY** request. The new object contains the same +manifest as the original. The segment objects are not copied. Instead, +both the original and new manifest objects share the same set of segment +objects. + + diff --git a/doc/source/api/object-expiration.rst b/doc/source/api/object-expiration.rst new file mode 100644 index 0000000000..e101b4de5e --- /dev/null +++ b/doc/source/api/object-expiration.rst @@ -0,0 +1,48 @@ +================= +Object expiration +================= + +You can schedule Object Storage (swift) objects to expire by setting the +``X-Delete-At`` or ``X-Delete-After`` header. Once the object is deleted, +swift will no longer serve the object and it will be deleted from the cluster +shortly thereafter. + +* Set an object to expire at an absolute time (in Unix time). You + can get the current Unix time by running ``date +'%s'``. + + .. code-block:: console + + $ swift post CONTAINER OBJECT_FILENAME -H "X-Delete-At:UNIX_TIME" + + Verify the ``X-Delete-At`` header has posted to the object: + + .. code-block:: console + + $ swift stat CONTAINER OBJECT_FILENAME + +* Set an object to expire after a relative amount of time (in seconds): + + .. code-block:: console + + $ swift post CONTAINER OBJECT_FILENAME -H "X-Delete-After:SECONDS" + + The ``X-Delete-After`` header will be converted to ``X-Delete-At``. + Verify the ``X-Delete-At`` header has posted to the object: + + .. code-block:: console + + $ swift stat CONTAINER OBJECT_FILENAME + + If you no longer want to expire the object, you can remove the + ``X-Delete-At`` header: + + .. 
code-block:: console + + $ swift post CONTAINER OBJECT_FILENAME -H "X-Remove-Delete-At:" + +.. note:: + + In order for object expiration to work properly, the + ``swift-object-expirer`` daemon will need access to all backend + servers in the cluster. The daemon does not need access to the + proxy-server or public network. diff --git a/doc/source/api/object_api_v1_overview.rst b/doc/source/api/object_api_v1_overview.rst new file mode 100644 index 0000000000..37fa28e40f --- /dev/null +++ b/doc/source/api/object_api_v1_overview.rst @@ -0,0 +1,194 @@ +Object Storage API overview +--------------------------- + +OpenStack Object Storage is a highly available, distributed, eventually +consistent object/blob store. You create, modify, and get objects and +metadata by using the Object Storage API, which is implemented as a set +of Representational State Transfer (REST) web services. + +For an introduction to OpenStack Object Storage, see the :doc:`/admin/index`. + +You use the HTTPS (SSL) protocol to interact with Object Storage, and +you use standard HTTP calls to perform API operations. You can also use +language-specific APIs, which use the RESTful API, that make it easier +for you to integrate into your applications. + +To assert your right to access and change data in an account, you +identify yourself to Object Storage by using an authentication token. To +get a token, you present your credentials to an authentication service. +The authentication service returns a token and the URL for the account. +Depending on which authentication service that you use, the URL for the +account appears in: + +- **OpenStack Identity Service**. The URL is defined in the service + catalog. + +- **Tempauth**. The URL is provided in the ``X-Storage-Url`` response + header. + +In both cases, the URL is the full URL and includes the account +resource. + +The Object Storage API supports the standard, non-serialized response +format, which is the default, and both JSON and XML serialized response +formats. + +The Object Storage system organizes data in a hierarchy, as follows: + +- **Account**. Represents the top-level of the hierarchy. + + Your service provider creates your account and you own all resources + in that account. The account defines a namespace for containers. A + container might have the same name in two different accounts. + + In the OpenStack environment, *account* is synonymous with a project + or tenant. + +- **Container**. Defines a namespace for objects. An object with the + same name in two different containers represents two different + objects. You can create any number of containers within an account. + + In addition to containing objects, you can also use the container to + control access to objects by using an access control list (ACL). You + cannot store an ACL with individual objects. + + In addition, you configure and control many other features, such as + object versioning, at the container level. + + You can bulk-delete up to 10,000 containers in a single request. + + You can set a storage policy on a container with predefined names + and definitions from your cloud provider. + +- **Object**. Stores data content, such as documents, images, and so + on. You can also store custom metadata with an object. + + With the Object Storage API, you can: + + - Store an unlimited number of objects. Each object can be as large + as 5 GB, which is the default. You can configure the maximum + object size. + + - Upload and store objects of any size with large object creation. 
+ + - Use cross-origin resource sharing to manage object security. + + - Compress files using content-encoding metadata. + + - Override browser behavior for an object using content-disposition metadata. + + - Schedule objects for deletion. + + - Bulk-delete up to 10,000 objects in a single request. + + - Auto-extract archive files. + + - Generate a URL that provides time-limited **GET** access to an + object. + + - Upload objects directly to the Object Storage system from a + browser by using form **POST** middleware. + + - Create symbolic links to other objects. + +The account, container, and object hierarchy affects the way you +interact with the Object Storage API. + +Specifically, the resource path reflects this structure and has this +format: + +.. code:: none + + /v1/{account}/{container}/{object} + +For example, for the ``flowers/rose.jpg`` object in the ``images`` +container in the ``12345678912345`` account, the resource path is: + +.. code:: none + + /v1/12345678912345/images/flowers/rose.jpg + +Notice that the object name contains the ``/`` character. This slash +does not indicate that Object Storage has a sub-hierarchy called +``flowers`` because containers do not store objects in actual +sub-folders. However, the inclusion of ``/`` or a similar convention +inside object names enables you to create pseudo-hierarchical folders +and directories. + +For example, if the endpoint for Object Storage is +``objects.mycloud.com``, the returned URL is +``https://objects.mycloud.com/v1/12345678912345``. + +To access a container, append the container name to the resource path. + +To access an object, append the container and the object name to the +path. + +If you have a large number of containers or objects, you can use query +parameters to page through large lists of containers or objects. Use the +``marker``, ``limit``, and ``end_marker`` query parameters to +control how many items are returned in a list and where the list starts +or ends. If you want to page through in reverse order, you can use the query +parameter ``reverse``, noting that your marker and end_markers should be +switched when applied to a reverse listing. I.e, for a list of objects +``[a, b, c, d, e]`` the non-reversed could be: + +.. code:: none + + /v1/{account}/{container}/?marker=a&end_marker=d + b + c + +However, when reversed marker and end_marker are applied to a reversed list: + +.. code:: none + + /v1/{account}/{container}/?marker=d&end_marker=a&reverse=on + c + b + +Object Storage HTTP requests have the following default constraints. +Your service provider might use different default values. + +============================ ============= ===== +Item Maximum value Notes +============================ ============= ===== +Number of HTTP headers 90 +Length of HTTP headers 4096 bytes +Length per HTTP request line 8192 bytes +Length of HTTP request 5 GB +Length of container names 256 bytes Cannot contain the ``/`` character. +Length of object names 1024 bytes By default, there are no character restrictions. +============================ ============= ===== + +You must UTF-8-encode and then URL-encode container and object names +before you call the API binding. If you use an API binding that performs +the URL-encoding for you, do not URL-encode the names before you call +the API binding. Otherwise, you double-encode these names. Check the +length restrictions against the URL-encoded string. 
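A minimal sketch of this encoding step, using only the Python standard library (the
account ID and names are placeholders):

.. code:: python

    from urllib.parse import quote

    # Hypothetical names containing non-ASCII characters.
    container = 'résumé-uploads'
    object_name = 'photos/fleur été.jpg'

    # quote() UTF-8-encodes and then percent-encodes. Keep "/" literal in
    # object names so pseudo-hierarchical folders are preserved.
    encoded_container = quote(container, safe='')
    encoded_object = quote(object_name, safe='/')

    path = '/v1/12345678912345/%s/%s' % (encoded_container, encoded_object)
    print(path)

    # Check the length limits (256 / 1024 bytes) against the encoded names.
    print(len(encoded_container), len(encoded_object))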
+ +The API Reference describes the operations that you can perform with the +Object Storage API: + +- `Storage + accounts `__: + Use to perform account-level tasks. + + Lists containers for a specified account. Creates, updates, and + deletes account metadata. Shows account metadata. + +- `Storage + containers `__: + Use to perform container-level tasks. + + Lists objects in a specified container. Creates, shows details for, + and deletes containers. Creates, updates, shows, and deletes + container metadata. + +- `Storage + objects `__: + Use to perform object-level tasks. + + Creates, replaces, shows details for, and deletes objects. Copies + objects with another object with a new or different name. Updates + object metadata. diff --git a/doc/source/api/object_versioning.rst b/doc/source/api/object_versioning.rst new file mode 100644 index 0000000000..b3438a6e49 --- /dev/null +++ b/doc/source/api/object_versioning.rst @@ -0,0 +1,351 @@ +================= +Object versioning +================= + +You can store multiple versions of your content so that you can recover +from unintended overwrites. Object versioning is an easy way to +implement version control, which you can use with any type of content. + +.. note:: + You cannot version a large-object manifest file, but the large-object + manifest file can point to versioned segments. + +.. note:: + It is strongly recommended that you put non-current objects in a + different container than the container where current object versions + reside. + +To allow object versioning within a cluster, the cloud provider should add the +``versioned_writes`` filter to the pipeline and set the +``allow_versioned_writes`` option to ``true`` in the +``[filter:versioned_writes]`` section of the proxy-server configuration file. + +To enable object versioning for a container, you must specify an "archive +container" that will retain non-current versions via either the +``X-Versions-Location`` or ``X-History-Location`` header. These two headers +enable two distinct modes of operation. Either mode may be used within a +cluster, but only one mode may be active for any given container. You must +UTF-8-encode and then URL-encode the container name before you include it in +the header. + +For both modes, **PUT** requests will archive any pre-existing objects before +writing new data, and **GET** requests will serve the current version. **COPY** +requests behave like a **GET** followed by a **PUT**; that is, if the copy +*source* is in a versioned container then the current version will be copied, +and if the copy *destination* is in a versioned container then any pre-existing +object will be archived before writing new data. + +If object versioning was enabled using ``X-History-Location``, then object +**DELETE** requests will copy the current version to the archive container then +remove it from the versioned container. + +If object versioning was enabled using ``X-Versions-Location``, then object +**DELETE** requests will restore the most-recent version from the archive +container, overwriting the current version. + +Example Using ``X-Versions-Location`` +------------------------------------- + +#. Create the ``current`` container: + + .. code:: console + + # curl -i $publicURL/current -X PUT -H "Content-Length: 0" -H "X-Auth-Token: $token" -H "X-Versions-Location: archive" + + .. 
code:: console + + HTTP/1.1 201 Created + Content-Length: 0 + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: txb91810fb717347d09eec8-0052e18997 + X-Openstack-Request-Id: txb91810fb717347d09eec8-0052e18997 + Date: Thu, 23 Jan 2014 21:28:55 GMT + +#. Create the first version of an object in the ``current`` container: + + .. code:: console + + # curl -i $publicURL/current/my_object --data-binary 1 -X PUT -H "Content-Length: 0" -H "X-Auth-Token: $token" + + .. code:: console + + HTTP/1.1 201 Created + Last-Modified: Thu, 23 Jan 2014 21:31:22 GMT + Content-Length: 0 + Etag: d41d8cd98f00b204e9800998ecf8427e + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: tx5992d536a4bd4fec973aa-0052e18a2a + X-Openstack-Request-Id: tx5992d536a4bd4fec973aa-0052e18a2a + Date: Thu, 23 Jan 2014 21:31:22 GMT + + Nothing is written to the non-current version container when you + initially **PUT** an object in the ``current`` container. However, + subsequent **PUT** requests that edit an object trigger the creation + of a version of that object in the ``archive`` container. + + These non-current versions are named as follows: + + .. code:: none + + / + + Where ``length`` is the 3-character, zero-padded hexadecimal + character length of the object, ```` is the object name, + and ```` is the time when the object was initially created + as a current version. + +#. Create a second version of the object in the ``current`` container: + + .. code:: console + + # curl -i $publicURL/current/my_object --data-binary 2 -X PUT -H "Content-Length: 0" -H "X-Auth-Token: $token" + + .. code:: console + + HTTP/1.1 201 Created + Last-Modified: Thu, 23 Jan 2014 21:41:32 GMT + Content-Length: 0 + Etag: d41d8cd98f00b204e9800998ecf8427e + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: tx468287ce4fc94eada96ec-0052e18c8c + X-Openstack-Request-Id: tx468287ce4fc94eada96ec-0052e18c8c + Date: Thu, 23 Jan 2014 21:41:32 GMT + +#. Issue a **GET** request to a versioned object to get the current + version of the object. You do not have to do any request redirects or + metadata lookups. + + List older versions of the object in the ``archive`` container: + + .. code:: console + + # curl -i $publicURL/archive?prefix=009my_object -X GET -H "X-Auth-Token: $token" + + .. code:: console + + HTTP/1.1 200 OK + Content-Length: 30 + X-Container-Object-Count: 1 + Accept-Ranges: bytes + X-Timestamp: 1390513280.79684 + X-Container-Bytes-Used: 0 + Content-Type: text/plain; charset=utf-8 + X-Trans-Id: tx9a441884997542d3a5868-0052e18d8e + X-Openstack-Request-Id: tx9a441884997542d3a5868-0052e18d8e + Date: Thu, 23 Jan 2014 21:45:50 GMT + + 009my_object/1390512682.92052 + + .. note:: + A **POST** request to a versioned object updates only the metadata + for the object and does not create a new version of the object. New + versions are created only when the content of the object changes. + +#. Issue a **DELETE** request to a versioned object to remove the + current version of the object and replace it with the next-most + current version in the non-current container. + + .. code:: console + + # curl -i $publicURL/current/my_object -X DELETE -H "X-Auth-Token: $token" + + .. code:: console + + HTTP/1.1 204 No Content + Content-Length: 0 + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: tx006d944e02494e229b8ee-0052e18edd + X-Openstack-Request-Id: tx006d944e02494e229b8ee-0052e18edd + Date: Thu, 23 Jan 2014 21:51:25 GMT + + List objects in the ``archive`` container to show that the archived + object was moved back to the ``current`` container: + + .. 
code:: console + + # curl -i $publicURL/archive?prefix=009my_object -X GET -H "X-Auth-Token: $token" + + .. code:: console + + HTTP/1.1 204 No Content + Content-Length: 0 + X-Container-Object-Count: 0 + Accept-Ranges: bytes + X-Timestamp: 1390513280.79684 + X-Container-Bytes-Used: 0 + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: tx044f2a05f56f4997af737-0052e18eed + X-Openstack-Request-Id: tx044f2a05f56f4997af737-0052e18eed + Date: Thu, 23 Jan 2014 21:51:41 GMT + + This next-most current version carries with it any metadata last set + on it. If want to completely remove an object and you have five + versions of it, you must **DELETE** it five times. + +Example Using ``X-History-Location`` +------------------------------------ + +#. Create the ``current`` container: + + .. code:: console + + # curl -i $publicURL/current -X PUT -H "Content-Length: 0" -H "X-Auth-Token: $token" -H "X-History-Location: archive" + + .. code:: console + + HTTP/1.1 201 Created + Content-Length: 0 + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: txb91810fb717347d09eec8-0052e18997 + X-Openstack-Request-Id: txb91810fb717347d09eec8-0052e18997 + Date: Thu, 23 Jan 2014 21:28:55 GMT + +#. Create the first version of an object in the ``current`` container: + + .. code:: console + + # curl -i $publicURL/current/my_object --data-binary 1 -X PUT -H "Content-Length: 0" -H "X-Auth-Token: $token" + + .. code:: console + + HTTP/1.1 201 Created + Last-Modified: Thu, 23 Jan 2014 21:31:22 GMT + Content-Length: 0 + Etag: d41d8cd98f00b204e9800998ecf8427e + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: tx5992d536a4bd4fec973aa-0052e18a2a + X-Openstack-Request-Id: tx5992d536a4bd4fec973aa-0052e18a2a + Date: Thu, 23 Jan 2014 21:31:22 GMT + + Nothing is written to the non-current version container when you + initially **PUT** an object in the ``current`` container. However, + subsequent **PUT** requests that edit an object trigger the creation + of a version of that object in the ``archive`` container. + + These non-current versions are named as follows: + + .. code:: none + + / + + Where ``length`` is the 3-character, zero-padded hexadecimal + character length of the object, ```` is the object name, + and ```` is the time when the object was initially created + as a current version. + +#. Create a second version of the object in the ``current`` container: + + .. code:: console + + # curl -i $publicURL/current/my_object --data-binary 2 -X PUT -H "Content-Length: 0" -H "X-Auth-Token: $token" + + .. code:: console + + HTTP/1.1 201 Created + Last-Modified: Thu, 23 Jan 2014 21:41:32 GMT + Content-Length: 0 + Etag: d41d8cd98f00b204e9800998ecf8427e + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: tx468287ce4fc94eada96ec-0052e18c8c + X-Openstack-Request-Id: tx468287ce4fc94eada96ec-0052e18c8c + Date: Thu, 23 Jan 2014 21:41:32 GMT + +#. Issue a **GET** request to a versioned object to get the current + version of the object. You do not have to do any request redirects or + metadata lookups. + + List older versions of the object in the ``archive`` container: + + .. code:: console + + # curl -i $publicURL/archive?prefix=009my_object -X GET -H "X-Auth-Token: $token" + + .. 
code:: console + + HTTP/1.1 200 OK + Content-Length: 30 + X-Container-Object-Count: 1 + Accept-Ranges: bytes + X-Timestamp: 1390513280.79684 + X-Container-Bytes-Used: 0 + Content-Type: text/plain; charset=utf-8 + X-Trans-Id: tx9a441884997542d3a5868-0052e18d8e + X-Openstack-Request-Id: tx9a441884997542d3a5868-0052e18d8e + Date: Thu, 23 Jan 2014 21:45:50 GMT + + 009my_object/1390512682.92052 + + .. note:: + A **POST** request to a versioned object updates only the metadata + for the object and does not create a new version of the object. New + versions are created only when the content of the object changes. + +#. Issue a **DELETE** request to a versioned object to copy the + current version of the object to the archive container then delete it from + the current container. Subsequent **GET** requests to the object in the + current container will return ``404 Not Found``. + + .. code:: console + + # curl -i $publicURL/current/my_object -X DELETE -H "X-Auth-Token: $token" + + .. code:: console + + HTTP/1.1 204 No Content + Content-Length: 0 + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: tx006d944e02494e229b8ee-0052e18edd + X-Openstack-Request-Id: tx006d944e02494e229b8ee-0052e18edd + Date: Thu, 23 Jan 2014 21:51:25 GMT + + List older versions of the object in the ``archive`` container: + + .. code:: console + + # curl -i $publicURL/archive?prefix=009my_object -X GET -H "X-Auth-Token: $token" + + .. code:: console + + HTTP/1.1 200 OK + Content-Length: 90 + X-Container-Object-Count: 3 + Accept-Ranges: bytes + X-Timestamp: 1390513280.79684 + X-Container-Bytes-Used: 0 + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: tx044f2a05f56f4997af737-0052e18eed + X-Openstack-Request-Id: tx044f2a05f56f4997af737-0052e18eed + Date: Thu, 23 Jan 2014 21:51:41 GMT + + 009my_object/1390512682.92052 + 009my_object/1390512692.23062 + 009my_object/1390513885.67732 + + In addition to the two previous versions of the object, the archive + container has a "delete marker" to record when the object was deleted. + + To permanently delete a previous version, issue a **DELETE** to the version + in the archive container. + +Disabling Object Versioning +--------------------------- + +To disable object versioning for the ``current`` container, remove +its ``X-Versions-Location`` metadata header by sending an empty key +value. + +.. code:: console + + # curl -i $publicURL/current -X PUT -H "Content-Length: 0" -H "X-Auth-Token: $token" -H "X-Versions-Location: " + +.. code:: console + + HTTP/1.1 202 Accepted + Content-Length: 76 + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: txe2476de217134549996d0-0052e19038 + X-Openstack-Request-Id: txe2476de217134549996d0-0052e19038 + Date: Thu, 23 Jan 2014 21:57:12 GMT + +

    <html>
      <h1>Accepted</h1>
      <p>The request is accepted for processing.</p>
    </html>
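
The same enable/disable cycle can be scripted. A minimal Python sketch (``requests``
library, placeholder storage URL and token) that turns versioning on with
``X-Versions-Location`` and later turns it off by sending an empty value, mirroring the
curl examples above:

.. code:: python

    import requests

    # Hypothetical values: substitute your own storage URL and token.
    public_url = 'https://storage.example.com/v1/AUTH_12345678912345'
    token = 'AUTH_tk0123456789abcdef'

    # Enable versioning: non-current versions of objects in "current"
    # are written to the "archive" container.
    requests.put(public_url + '/current',
                 headers={'X-Auth-Token': token,
                          'X-Versions-Location': 'archive'})

    # Disable versioning again by sending an empty header value.
    resp = requests.put(public_url + '/current',
                        headers={'X-Auth-Token': token,
                                 'X-Versions-Location': ''})
    print(resp.status_code)  # expect 202 Accepted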

+ diff --git a/doc/source/api/pagination.rst b/doc/source/api/pagination.rst new file mode 100644 index 0000000000..8af0f42baa --- /dev/null +++ b/doc/source/api/pagination.rst @@ -0,0 +1,137 @@ +================================================= +Page through large lists of containers or objects +================================================= + +If you have a large number of containers or objects, you can use the +``marker``, ``limit``, and ``end_marker`` parameters to control +how many items are returned in a list and where the list starts or ends. +If you want to page backwards you can use the ``reverse`` parameter. + +* marker + When you request a list of containers or objects, Object Storage + returns a maximum of 10,000 names for each request. To get + subsequent names, you must make another request with the + ``marker`` parameter. Set the ``marker`` parameter to the name of + the last item returned in the previous list. You must URL-encode the + ``marker`` value before you send the HTTP request. Object Storage + returns a maximum of 10,000 names starting after the last item + returned. + +* limit + To return fewer than 10,000 names, use the ``limit`` parameter. If + the number of names returned equals the specified ``limit`` (or + 10,000 if you omit the ``limit`` parameter), you can assume there + are more names to list. If the number of names in the list is + exactly divisible by the ``limit`` value, the last request has no + content. + +* end_marker + Limits the result set to names that are less than the + ``end_marker`` parameter value. You must URL-encode the + ``end_marker`` value before you send the HTTP request. + +* reverse + By default, listings are returned sorted by name, ascending. If you + include the ``reverse=true`` query parameter, the listing will be + returned sorted by name, descending. + +To page through a large list of containers +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +Assume the following list of container names: + +.. code-block:: console + + apples + bananas + kiwis + oranges + pears + +#. Use a ``limit`` of two: + + .. code-block:: console + + # curl -i $publicURL/?limit=2 -X GET -H "X-Auth-Token: $token" + + .. code-block:: console + + apples + bananas + + Because two container names are returned, there are more names to + list. + +#. Make another request with a ``marker`` parameter set to the name of + the last item returned: + + .. code-block:: console + + # curl -i $publicURL/?limit=2&marker=bananas -X GET -H \ + “X-Auth-Token: $token" + + .. code-block:: console + + kiwis + oranges + + Again, two items are returned, and there might be more. + +#. Make another request with a ``marker`` of the last item returned: + + .. code-block:: console + + # curl -i $publicURL/?limit=2&marker=oranges -X GET -H \" + X-Auth-Token: $token" + + .. code-block:: console + + pears + + You receive a one-item response, which is fewer than the ``limit`` + number of names. This indicates that this is the end of the list. + +#. Use the ``end_marker`` parameter to limit the result set to object + names that are less than the ``end_marker`` parameter value: + + .. code-block:: console + + # curl -i $publicURL/?end_marker=oranges -X GET -H \" + X-Auth-Token: $token" + + .. code-block:: console + + apples + bananas + kiwis + + You receive a result set of all container names before the + ``end-marker`` value. + +#. Use the ``reverse`` parameter to work from the back of the + list: + + .. 
code-block:: console + + # curl -i $publicURL/?reverse=true -X GET -H \" + X-Auth-Token: $token" + + .. code-block:: console + + pears + oranges + kiwis + bananas + apples + +#. You can also combine parameters: + + .. code-block:: console + + # curl -i $publicURL/?reverse=true&end_marker=kiwis -X GET -H \" + X-Auth-Token: $token" + + .. code-block:: console + + pears + oranges diff --git a/doc/source/api/pseudo-hierarchical-folders-directories.rst b/doc/source/api/pseudo-hierarchical-folders-directories.rst new file mode 100644 index 0000000000..c7e764f2db --- /dev/null +++ b/doc/source/api/pseudo-hierarchical-folders-directories.rst @@ -0,0 +1,155 @@ +=========================================== +Pseudo-hierarchical folders and directories +=========================================== + +Although you cannot nest directories in OpenStack Object Storage, you +can simulate a hierarchical structure within a single container by +adding forward slash characters (``/``) in the object name. To navigate +the pseudo-directory structure, you can use the ``delimiter`` query +parameter. This example shows you how to use pseudo-hierarchical folders +and directories. + +.. note:: + + In this example, the objects reside in a container called ``backups``. + Within that container, the objects are organized in a pseudo-directory + called ``photos``. The container name is not displayed in the example, + but it is a part of the object URLs. For instance, the URL of the + picture ``me.jpg`` is + ``https://swift.example.com/v1/CF_xer7_343/backups/photos/me.jpg``. + +List pseudo-hierarchical folders request: HTTP +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +To display a list of all the objects in the storage container, use +``GET`` without a ``delimiter`` or ``prefix``. + +.. code-block:: console + + $ curl -X GET -i -H "X-Auth-Token: $token" \ + $publicurl/v1/AccountString/backups + +The system returns status code 2xx (between 200 and 299, inclusive) and +the requested list of the objects. + +.. code-block:: console + + photos/animals/cats/persian.jpg + photos/animals/cats/siamese.jpg + photos/animals/dogs/corgi.jpg + photos/animals/dogs/poodle.jpg + photos/animals/dogs/terrier.jpg + photos/me.jpg + photos/plants/fern.jpg + photos/plants/rose.jpg + +Use the delimiter parameter to limit the displayed results. To use +``delimiter`` with pseudo-directories, you must use the parameter slash +(``/``). + +.. code-block:: console + + $ curl -X GET -i -H "X-Auth-Token: $token" \ + $publicurl/v1/AccountString/backups?delimiter=/ + +The system returns status code 2xx (between 200 and 299, inclusive) and +the requested matching objects. Because you use the slash, only the +pseudo-directory ``photos/`` displays. The returned values from a slash +``delimiter`` query are not real objects. The value will refer to +a real object if it does not end with a slash. The pseudo-directories +have no content-type, rather, each pseudo-directory has +its own ``subdir`` entry in the response of JSON and XML results. +For example: + +.. code-block:: JSON + + [ + { + "subdir": "photos/" + } + ] + +.. code-block:: XML + + + + + photos/ + + + +Use the ``prefix`` and ``delimiter`` parameters to view the objects +inside a pseudo-directory, including further nested pseudo-directories. + +.. 
code-block:: console + + $ curl -X GET -i -H "X-Auth-Token: $token" \ + $publicurl/v1/AccountString/backups?prefix=photos/&delimiter=/ + +The system returns status code 2xx (between 200 and 299, inclusive) and +the objects and pseudo-directories within the top level +pseudo-directory. + +.. code-block:: console + + photos/animals/ + photos/me.jpg + photos/plants/ + +.. code-block:: JSON + + [ + { + "subdir": "photos/animals/" + }, + { + "hash": "b249a153f8f38b51e92916bbc6ea57ad", + "last_modified": "2015-12-03T17:31:28.187370", + "bytes": 2906, + "name": "photos/me.jpg", + "content_type": "image/jpeg" + }, + { + "subdir": "photos/plants/" + } + ] + +.. code-block:: XML + + + + + photos/animals/ + + + photos/me.jpg + b249a153f8f38b51e92916bbc6ea57ad + 2906 + image/jpeg + 2015-12-03T17:31:28.187370 + + + photos/plants/ + + + +You can create an unlimited number of nested pseudo-directories. To +navigate through them, use a longer ``prefix`` parameter coupled with +the ``delimiter`` parameter. In this sample output, there is a +pseudo-directory called ``dogs`` within the pseudo-directory +``animals``. To navigate directly to the files contained within +``dogs``, enter the following command: + +.. code-block:: console + + $ curl -X GET -i -H "X-Auth-Token: $token" \ + $publicurl/v1/AccountString/backups?prefix=photos/animals/dogs/&delimiter=/ + +The system returns status code 2xx (between 200 and 299, inclusive) and +the objects and pseudo-directories within the nested pseudo-directory. + +.. code-block:: console + + photos/animals/dogs/corgi.jpg + photos/animals/dogs/poodle.jpg + photos/animals/dogs/terrier.jpg diff --git a/doc/source/api/serialized-response-formats.rst b/doc/source/api/serialized-response-formats.rst new file mode 100644 index 0000000000..8e60c7fcf6 --- /dev/null +++ b/doc/source/api/serialized-response-formats.rst @@ -0,0 +1,119 @@ +=========================== +Serialized response formats +=========================== + +By default, the Object Storage API uses a ``text/plain`` response +format. In addition, both JSON and XML data serialization response +formats are supported. + +To define the response format, use one of these methods: + ++-------------------+-------------------------------------------------------+ +|Method |Description | ++===================+=======================================================+ +|format= ``format`` |Append this parameter to the URL for a ``GET`` request,| +|query parameter |where ``format`` is ``json`` or ``xml``. | ++-------------------+-------------------------------------------------------+ +|``Accept`` request |Include this header in the ``GET`` request. | +|header |The valid header values are: | +| | | +| |text/plain | +| | Plain text response format. The default. | +| |application/jsontext | +| | JSON data serialization response format. | +| |application/xml | +| | XML data serialization response format. | +| |text/xml | +| | XML data serialization response format. | ++-------------------+-------------------------------------------------------+ + +Example 1. JSON example with format query parameter +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +For example, this request uses the ``format`` query parameter to ask +for a JSON response: + +.. code-block:: console + + $ curl -i $publicURL?format=json -X GET -H "X-Auth-Token: $token" + +.. 
code-block:: console + + HTTP/1.1 200 OK + Content-Length: 96 + X-Account-Object-Count: 1 + X-Timestamp: 1389453423.35964 + X-Account-Meta-Subject: Literature + X-Account-Bytes-Used: 14 + X-Account-Container-Count: 2 + Content-Type: application/json; charset=utf-8 + Accept-Ranges: bytes + X-Trans-Id: tx274a77a8975c4a66aeb24-0052d95365 + Date: Fri, 17 Jan 2014 15:59:33 GMT + +Object Storage lists container names with additional information in JSON +format: + +.. code-block:: json + + [ + { + "count":0, + "bytes":0, + "name":"janeausten" + }, + { + "count":1, + "bytes":14, + "name":"marktwain" + } + ] + + +Example 2. XML example with Accept header +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +This request uses the ``Accept`` request header to ask for an XML +response: + +.. code-block:: console + + $ curl -i $publicURL -X GET -H "X-Auth-Token: $token" -H \ + "Accept: application/xml; charset=utf-8" + +.. code-block:: console + + HTTP/1.1 200 OK + Content-Length: 263 + X-Account-Object-Count: 3 + X-Account-Meta-Book: MobyDick + X-Timestamp: 1389453423.35964 + X-Account-Bytes-Used: 47 + X-Account-Container-Count: 2 + Content-Type: application/xml; charset=utf-8 + Accept-Ranges: bytes + X-Trans-Id: txf0b4c9727c3e491694019-0052e03420 + Date: Wed, 22 Jan 2014 21:12:00 GMT + +Object Storage lists container names with additional information in XML +format: + +.. code-block:: xml + + + + + janeausten + 2 + 33 + + + marktwain + 1 + 14 + + + +The remainder of the examples in this guide use standard, non-serialized +responses. However, all ``GET`` requests that perform list operations +accept the ``format`` query parameter or ``Accept`` request header. diff --git a/doc/source/api/static-website.rst b/doc/source/api/static-website.rst new file mode 100644 index 0000000000..48dd34c9df --- /dev/null +++ b/doc/source/api/static-website.rst @@ -0,0 +1,120 @@ +.. _static-website: + +===================== +Create static website +===================== + +To discover whether your Object Storage system supports this feature, +see :ref:`discoverability`. Alternatively, check with your service +provider. + +You can use your Object Storage account to create a static website. This +static website is created with Static Web middleware and serves container +data with a specified index file, error file resolution, and optional +file listings. This mode is normally active only for anonymous requests, +which provide no authentication token. To use it with authenticated +requests, set the header ``X-Web-Mode`` to ``TRUE`` on the request. + +The Static Web filter must be added to the pipeline in your +``/etc/swift/proxy-server.conf`` file below any authentication +middleware. You must also add a Static Web middleware configuration +section. + +Your publicly readable containers are checked for two headers, +``X-Container-Meta-Web-Index`` and ``X-Container-Meta-Web-Error``. The +``X-Container-Meta-Web-Error`` header is discussed below, in the +section called :ref:`set_error_static_website`. + +Use ``X-Container-Meta-Web-Index`` to determine the index file (or +default page served, such as ``index.html``) for your website. When +someone initially enters your site, the ``index.html`` file displays +automatically. If you create sub-directories for your site by creating +pseudo-directories in your container, the index page for each +sub-directory is displayed by default. If your pseudo-directory does not +have a file with the same name as your index file, visits to the +sub-directory return a 404 error. 
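The ``swift`` client commands shown below set these values as container metadata; the
equivalent raw API call simply sends the corresponding header in a ``POST`` to the
container. A hedged sketch with the Python ``requests`` library (placeholder storage
URL, token, and container name):

.. code:: python

    import requests

    # Hypothetical values: substitute your own storage URL and token.
    public_url = 'https://storage.example.com/v1/AUTH_12345678912345'
    token = 'AUTH_tk0123456789abcdef'

    # Serve index.html by default when visitors browse the container.
    resp = requests.post(public_url + '/container',
                         headers={'X-Auth-Token': token,
                                  'X-Container-Meta-Web-Index': 'index.html'})
    print(resp.status_code)  # expect 204 No Content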
+ +You also have the option of displaying a list of files in your +pseudo-directory instead of a web page. To do this, set the +``X-Container-Meta-Web-Listings`` header to ``TRUE``. You may add styles +to your file listing by setting ``X-Container-Meta-Web-Listings-CSS`` +to a style sheet (for example, ``lists.css``). + +Static Web middleware through Object Storage +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +The following sections show how to use Static Web middleware through +Object Storage. + +Make container publicly readable +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +Make the container publicly readable. Once the container is publicly +readable, you can access your objects directly, but you must set the +index file to browse the main site URL and its sub-directories. + +.. code-block:: console + + $ swift post -r '.r:*,.rlistings' container + + +Set site index file +^^^^^^^^^^^^^^^^^^^ + +Set the index file. In this case, ``index.html`` is the default file +displayed when the site appears. + +.. code-block:: console + + $ swift post -m 'web-index:index.html' container + +Enable file listing +^^^^^^^^^^^^^^^^^^^ + +Turn on file listing. If you do not set the index file, the URL displays +a list of the objects in the container. Instructions on styling the list +with a CSS follow. + +.. code-block:: console + + $ swift post -m 'web-listings: true' container + +Enable CSS for file listing +^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +Style the file listing using a CSS. + +.. code-block:: console + + $ swift post -m 'web-listings-css:listings.css' container + +.. _set_error_static_website: + +Set error pages for static website +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +You can create and set custom error pages for visitors to your website; +currently, only 401 (Unauthorized) and 404 (Not Found) errors are +supported. To do this, set the metadata header, +``X-Container-Meta-Web-Error``. + +Error pages are served with the status code pre-pended to the name of +the error page you set. For instance, if you set +``X-Container-Meta-Web-Error`` to ``error.html``, 401 errors will +display the page ``401error.html``. Similarly, 404 errors will display +``404error.html``. You must have both of these pages created in your +container when you set the ``X-Container-Meta-Web-Error`` metadata, or +your site will display generic error pages. + +You only have to set the ``X-Container-Meta-Web-Error`` metadata once +for your entire static website. + +Set error pages for static website request +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +.. code-block:: console + + $ swift post -m 'web-error:error.html' container + + +Any 2\ ``nn`` response indicates success. diff --git a/doc/source/api/temporary_url_middleware.rst b/doc/source/api/temporary_url_middleware.rst new file mode 100644 index 0000000000..767b4722aa --- /dev/null +++ b/doc/source/api/temporary_url_middleware.rst @@ -0,0 +1,230 @@ +======================== +Temporary URL middleware +======================== + +To discover whether your Object Storage system supports this feature, +check with your service provider or send a **GET** request using the ``/info`` +path. + +A temporary URL gives users temporary access to objects. For example, a +website might want to provide a link to download a large object in +Object Storage, but the Object Storage account has no public access. The +website can generate a URL that provides time-limited **GET** access to +the object. 
When the web browser user clicks on the link, the browser +downloads the object directly from Object Storage, eliminating the need +for the website to act as a proxy for the request. + +Furthermore, a temporary URL can be prefix-based. These URLs +contain a signature which is valid for all objects which share +a common prefix. They are useful for sharing a set of objects. + +Ask your cloud administrator to enable the temporary URL feature. For +information, see :ref:`tempurl` in the *Source Documentation*. + +.. note:: + + To use **POST** requests to upload objects to specific Object Storage + locations, use :doc:`form_post_middleware` instead of temporary URL middleware. + +Temporary URL format +~~~~~~~~~~~~~~~~~~~~ + +A temporary URL is comprised of the URL for an object with added query +parameters: + +**Example Temporary URL format** + +.. code:: none + + https://swift-cluster.example.com/v1/my_account/container/object + ?temp_url_sig=732fcac368abb10c78a4cbe95c3fab7f311584532bf779abd5074e13cbe8b88b + &temp_url_expires=1323479485 + &filename=My+Test+File.pdf + +The example shows these elements: + + +**Object URL**: Required. The full path URL to the object. + +**temp\_url\_sig**: Required. An HMAC cryptographic signature that defines +the allowed HTTP method, expiration date, full path to the object, and the +secret key for the temporary URL. The digest used (for example, SHA-256 or +SHA-512) must be supported by the cluster; supported digests will be listed +in the ``tempurl.allowed_digests`` key in the cluster's capabilities. + +**temp\_url\_expires**: Required. An expiration date as a UNIX Epoch timestamp +or ISO 8601 UTC timestamp. For example, ``1390852007`` or +``2014-01-27T19:46:47Z`` can be used to represent +``Mon, 27 Jan 2014 19:46:47 GMT``. + +For more information, see `Epoch & Unix Timestamp Conversion +Tools `__. + +**filename**: Optional. Overrides the default file name. Object Storage +generates a default file name for **GET** temporary URLs that is based on the +object name. Object Storage returns this value in the ``Content-Disposition`` +response header. Browsers can interpret this file name value as a file +attachment to be saved. + +A prefix-based temporary URL is similar but requires the parameter +``temp_url_prefix``, which must be equal to the common prefix shared +by all object names for which the URL is valid. + +.. code:: none + + https://swift-cluster.example.com/v1/my_account/container/my_prefix/object + ?temp_url_sig=732fcac368abb10c78a4cbe95c3fab7f311584532bf779abd5074e13cbe8b88b + &temp_url_expires=2011-12-10T01:11:25Z + &temp_url_prefix=my_prefix + +.. _secret_keys: + +Secret Keys +~~~~~~~~~~~ + +The cryptographic signature used in Temporary URLs and also in +:doc:`form_post_middleware` uses a secret key. Object Storage allows you to +store two secret key values per account, and two per container. When validating +a request, Object Storage checks signatures against all keys. Using two keys at +each level enables key rotation without invalidating existing temporary URLs. 
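
For example, a simple key rotation, sketched here with placeholder key values
and using the account-level headers described below, sets the second key to a
new secret and only replaces the original key once previously issued URLs are
no longer needed:

.. code:: console

   $ swift post -m "Temp-URL-Key-2:NEWKEY"
   $ swift post -m "Temp-URL-Key:NEWKEY"

Between the two commands, signatures made with either ``MYKEY`` or ``NEWKEY``
validate, so URLs signed with the old key keep working until you retire it.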
+ +To set the keys at the account level, set one or both of the following +request headers to arbitrary values on a **POST** request to the account: + +- ``X-Account-Meta-Temp-URL-Key`` + +- ``X-Account-Meta-Temp-URL-Key-2`` + +To set the keys at the container level, set one or both of the following +request headers to arbitrary values on a **POST** or **PUT** request to the +container: + +- ``X-Container-Meta-Temp-URL-Key`` + +- ``X-Container-Meta-Temp-URL-Key-2`` + +The arbitrary values serve as the secret keys. + +For example, use the **swift post** command to set the secret key to +*``MYKEY``*: + +.. code:: console + + $ swift post -m "Temp-URL-Key:MYKEY" + +.. note:: + + Changing these headers invalidates any previously generated temporary + URLs within 60 seconds, which is the memcache time for the key. + +HMAC signature for temporary URLs +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +Temporary URL middleware uses an HMAC cryptographic signature. This +signature includes these elements: + +- The allowed method. Typically, **GET** or **PUT**. + +- Expiry time. In the example for the HMAC-SHA256 signature for temporary + URLs below, the expiry time is set to ``86400`` seconds (or 1 day) + into the future. Please be aware that you have to use a UNIX timestamp + for generating the signature (in the API request it is also allowed to + use an ISO 8601 UTC timestamp). + +- The path. Starting with ``/v1/`` onwards and including a container + name and object. The path for prefix-based signatures must start with + ``prefix:/v1/``. Do not URL-encode the path at this stage. + +- The secret key. Use one of the key values as described + in :ref:`secret_keys`. + +These sample Python codes show how to compute a signature for use with +temporary URLs: + +**Example HMAC-SHA256 signature for object-based temporary URLs** + +.. code:: python + + import hmac + from hashlib import sha256 + from time import time + method = 'GET' + duration_in_seconds = 60*60*24 + expires = int(time() + duration_in_seconds) + path = '/v1/my_account/container/object' + key = 'MYKEY' + hmac_body = '%s\n%s\n%s' % (method, expires, path) + signature = hmac.new(key, hmac_body, sha256).hexdigest() + +**Example HMAC-SHA512 signature for prefix-based temporary URLs** + +.. code:: python + + import hmac + from hashlib import sha512 + from time import time + method = 'GET' + duration_in_seconds = 60*60*24 + expires = int(time() + duration_in_seconds) + path = 'prefix:/v1/my_account/container/my_prefix' + key = 'MYKEY' + hmac_body = '%s\n%s\n%s' % (method, expires, path) + signature = hmac.new(key, hmac_body, sha512).hexdigest() + +Do not URL-encode the path when you generate the HMAC signature. +However, when you make the actual HTTP request, you should properly +URL-encode the URL. + +The *``MYKEY``* value is one of the key values as described +in :ref:`secret_keys`. + +For more information, see `RFC 2104: HMAC: Keyed-Hashing for Message +Authentication `__. + +If you want to transform a UNIX timestamp into an ISO 8601 UTC timestamp, +you can use following code snippet: + +.. code:: python + + import time + time.strftime('%Y-%m-%dT%H:%M:%SZ', time.gmtime(timestamp)) + +Using the ``swift`` tool to generate a Temporary URL +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +The ``swift`` tool provides the tempurl_ option that +auto-generates the *``temp_url_sig``* and *``temp_url_expires``* query +parameters. For example, you might run this command: + +.. 
code:: console + + $ swift tempurl GET 3600 /v1/my_account/container/object MYKEY + +.. note:: + + The ``swift`` tool is not yet updated and continues to use the + deprecated cipher SHA1. + +This command returns the path: + +.. code:: none + + /v1/my_account/container/object + ?temp_url_sig=5c4cc8886f36a9d0919d708ade98bf0cc71c9e91 + &temp_url_expires=1374497657 + +To create the temporary URL, prefix this path with the Object Storage +storage host name. For example, prefix the path with +``https://swift-cluster.example.com``, as follows: + +.. code:: none + + https://swift-cluster.example.com/v1/my_account/container/object + ?temp_url_sig=5c4cc8886f36a9d0919d708ade98bf0cc71c9e91 + &temp_url_expires=1374497657 + +Note that if the above example is copied exactly, and used in a command +shell, then the ampersand is interpreted as an operator and the URL +will be truncated. Enclose the URL in quotation marks to avoid this. + +.. _tempurl: https://docs.openstack.org/python-swiftclient/latest/cli/index.html#swift-tempurl diff --git a/doc/source/api/use_content-encoding_metadata.rst b/doc/source/api/use_content-encoding_metadata.rst new file mode 100644 index 0000000000..18c94878e6 --- /dev/null +++ b/doc/source/api/use_content-encoding_metadata.rst @@ -0,0 +1,22 @@ +============================= +Use Content-Encoding metadata +============================= + +When you create an object or update its metadata, you can optionally set +the ``Content-Encoding`` metadata. This metadata enables you to indicate +that the object content is compressed without losing the identity of the +underlying media type (``Content-Type``) of the file, such as a video. + +**Example Content-Encoding header request: HTTP** + +This example assigns an attachment type to the ``Content-Encoding`` +header that indicates how the file is downloaded: + +.. code:: none + + PUT //// HTTP/1.1 + Host: storage.clouddrive.com + X-Auth-Token: eaaafd18-0fed-4b3a-81b4-663c99ec1cbb + Content-Type: video/mp4 + Content-Encoding: gzip + diff --git a/doc/source/api/use_the_content-disposition_metadata.rst b/doc/source/api/use_the_content-disposition_metadata.rst new file mode 100644 index 0000000000..fc6cf95fc7 --- /dev/null +++ b/doc/source/api/use_the_content-disposition_metadata.rst @@ -0,0 +1,31 @@ +==================================== +Use the Content-Disposition metadata +==================================== + +To override the default behavior for a browser, use the +``Content-Disposition`` header to specify the override behavior and +assign this header to an object. For example, this header might specify +that the browser use a download program to save this file rather than +show the file, which is the default. + +**Example Override browser default behavior request: HTTP** + +This example assigns an attachment type to the ``Content-Disposition`` +header. This attachment type indicates that the file is to be downloaded +as ``goodbye.txt``: + +.. code:: console + + # curl -i $publicURL/marktwain/goodbye -X POST -H "X-Auth-Token: $token" -H "Content-Length: 14" -H "Content-Type: application/octet-stream" -H "Content-Disposition: attachment; filename=goodbye.txt" + +.. code:: console + + HTTP/1.1 202 Accepted + Content-Length: 76 + Content-Type: text/html; charset=UTF-8 + X-Trans-Id: txa9b5e57d7f354d7ea9f57-0052e17e13 + X-Openstack-Request-Id: txa9b5e57d7f354d7ea9f57-0052e17e13 + Date: Thu, 23 Jan 2014 20:39:47 GMT + +

   <html><h1>Accepted</h1><p>The request is accepted for processing.</p></html>

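
Once the metadata is set, the override is returned on subsequent downloads of
the object. A sketch of the expected exchange (headers other than
``Content-Disposition`` are illustrative):

.. code:: console

   # curl -i $publicURL/marktwain/goodbye -X GET -H "X-Auth-Token: $token"

.. code:: console

   HTTP/1.1 200 OK
   Content-Length: 14
   Content-Type: application/octet-stream
   Content-Disposition: attachment; filename=goodbye.txt
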
+ diff --git a/doc/source/associated_projects.rst b/doc/source/associated_projects.rst index 10e01fbc4e..27db41fa3d 100644 --- a/doc/source/associated_projects.rst +++ b/doc/source/associated_projects.rst @@ -3,49 +3,89 @@ Associated Projects =================== +.. _application-bindings: Application Bindings -------------------- * OpenStack supported binding: - * `Python-SwiftClient `_ + * `Python-SwiftClient `_ -* Made for Cloud Files, but mostly work with Swift too: +* Unofficial libraries and bindings: - * `CSharp-CloudFiles `_ - * `Java-CloudFiles `_ - * `PHP-CloudFiles `_ - * `Python-CloudFiles `_ - * `Ruby-CloudFiles `_ + * PHP -* `RSwift `_ - Unofficial R API bindings. + * `PHP-opencloud `_ - Official Rackspace PHP + bindings that should work for other Swift deployments too. + + * Ruby + + * `swift_client `_ - + Small but powerful Ruby client to interact with OpenStack Swift + * `nightcrawler_swift `_ - + This Ruby gem teleports your assets to an OpenStack Swift bucket/container + * `swift storage `_ - + Simple OpenStack Swift storage client. + + * Java + + * `libcloud `_ - Apache Libcloud - a unified + interface in Python for different clouds with OpenStack Swift support. + * `jclouds `_ - + Java library offering bindings for all OpenStack projects + * `java-openstack-swift `_ - + Java bindings for OpenStack Swift + * `javaswift `_ - Collection of Java tools for Swift + + * Bash + + * `supload `_ - Bash script to + upload file to cloud storage based on OpenStack Swift API. + + * .NET + + * `openstacknetsdk.org `_ - An OpenStack + Cloud SDK for Microsoft .NET. + + * Go + + * `Go language bindings `_ + * `Gophercloud an OpenStack SDK for Go `_ -* `Go language bindings `_ Authentication -------------- -* `Keystone `_ - Official Identity Service for OpenStack. -* `Swauth `_ - Older Swift authentication service that only requires Swift itself. +* `Keystone `_ - Official Identity + Service for OpenStack. +* `Swauth `_ - **RETIRED**: An alternative Swift + authentication service that only requires Swift itself. +* `Basicauth `_ - HTTP Basic + authentication support (keystone backed). Command Line Access ------------------- -* `Swiftly `_ - Alternate command line access to Swift with direct (no proxy) access capabilities as well. +* `Swiftly `_ - Alternate command line + access to Swift with direct (no proxy) access capabilities as well. Log Processing -------------- -* `Slogging `_ - Basic stats and logging tools. +* `slogging `_ - Basic stats and + logging tools. Monitoring & Statistics ----------------------- -* `Swift Informant `_ - Swift Proxy Middleware to send events to a statsd instance. +* `Swift Informant `_ - + Swift proxy Middleware to send events to a statsd instance. +* `Swift Inspector `_ - + Swift middleware to relay information about a request back to the client. Content Distribution Network Integration @@ -57,8 +97,18 @@ Content Distribution Network Integration Alternative API --------------- -* `Swift3 `_ - Amazon S3 API emulation. -* `CDMI `_ - CDMI support +* `ProxyFS `_ - Integrated file and + object access for Swift object storage +* `SwiftHLM `_ - a middleware for + using OpenStack Swift with tape and other high latency media storage + backends. + + +Benchmarking/Load Generators +---------------------------- + +* `getput `_ - getput tool suite +* `COSbench `_ - COSbench tool suite .. 
_custom-logger-hooks-label: @@ -66,9 +116,51 @@ Alternative API Custom Logger Hooks ------------------- -* `swift-sentry `_ - Sentry exception reporting for Swift +* `swift-sentry `_ - + Sentry exception reporting for Swift + +Storage Backends (DiskFile API implementations) +----------------------------------------------- +* `Swift-on-File `_ - + Enables objects created using Swift API to be accessed as files on a POSIX + filesystem and vice versa. +* `swift-scality-backend `_ - + Scality sproxyd object server implementation for Swift. + +Developer Tools +--------------- +* `SAIO bash scripts `_ - + Well commented simple bash scripts for Swift all in one setup. +* `vagrant-swift-all-in-one + `_ - Quickly setup a + standard development environment using Vagrant and Chef cookbooks in an + Ubuntu virtual machine. +* `SAIO Ansible playbook `_ - + Quickly setup a standard development environment using Vagrant and Ansible in + a Fedora virtual machine (with built-in `Swift-on-File + `_ support). +* `Multi Swift `_ - + Bash scripts to spin up multiple Swift clusters sharing the same hardware + Other ----- -* `Glance `_ - Provides services for discovering, registering, and retrieving virtual machine images (for OpenStack Compute [Nova], for example). +* `Glance `_ - Provides services for + discovering, registering, and retrieving virtual machine images + (for OpenStack Compute [Nova], for example). +* `Django Swiftbrowser `_ - + Simple Django web app to access OpenStack Swift. +* `Swift-account-stats `_ - + Swift-account-stats is a tool to report statistics on Swift usage at + tenant and global levels. +* `PyECLib `_ - High-level erasure code + library used by Swift +* `liberasurecode `_ - Low-level + erasure code library used by PyECLib +* `Swift Browser `_ - JavaScript + interface for Swift +* `swift-ui `_ - OpenStack Swift + web browser +* `swiftbackmeup `_ - + Utility that allows one to create backups and upload them to OpenStack Swift diff --git a/doc/source/audit_watchers.rst b/doc/source/audit_watchers.rst new file mode 100644 index 0000000000..51ca39537e --- /dev/null +++ b/doc/source/audit_watchers.rst @@ -0,0 +1,12 @@ +.. _common_audit_watchers: + +********************* +Object Audit Watchers +********************* + +.. _dark_data: + +Dark Data +========= + +.. automodule:: swift.obj.watchers.dark_data diff --git a/doc/source/conf.py b/doc/source/conf.py index c1cb24ddf9..c8a0d7afb9 100644 --- a/doc/source/conf.py +++ b/doc/source/conf.py @@ -1,5 +1,18 @@ # -*- coding: utf-8 -*- -# Copyright (c) 2010-2012 OpenStack, LLC. +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# +# Copyright (c) 2010-2012 OpenStack Foundation. # # Swift documentation build configuration file, created by # sphinx-quickstart on Tue May 18 13:50:15 2010. @@ -13,8 +26,19 @@ # All configuration values have a default; values that are commented out # serve to show the default. 
-import sys +import datetime +import logging import os +import sys + +# NOTE(amotoki): Our current doc build job uses an older version of +# liberasurecode which comes from Ubuntu 16.04. +# pyeclib emits a warning message if liberasurecode <1.3.1 is used [1] and +# this causes the doc build failure if warning-is-error is enabled in Sphinx. +# As a workaround we suppress the warning message from pyeclib until we use +# a newer version of liberasurecode in our doc build job. +# [1] https://github.com/openstack/pyeclib/commit/d163972b +logging.getLogger('pyeclib').setLevel(logging.ERROR) # If extensions (or modules to document with autodoc) are in another directory, # add these directories to sys.path here. If the directory is relative to the @@ -26,56 +50,47 @@ # Add any Sphinx extension module names here, as strings. They can be # extensions coming with Sphinx (named 'sphinx.ext.*') or your custom ones. -extensions = ['sphinx.ext.autodoc', 'sphinx.ext.intersphinx', - 'sphinx.ext.todo', 'sphinx.ext.coverage', 'sphinx.ext.pngmath', - 'sphinx.ext.ifconfig'] +extensions = ['sphinx.ext.autodoc', + 'sphinx.ext.todo', + 'sphinx.ext.coverage', + 'sphinx.ext.ifconfig', + 'openstackdocstheme', + 'sphinxcontrib.rsvgconverter'] todo_include_todos = True # Add any paths that contain templates here, relative to this directory. -# Changing the path so that the Hudson build output contains GA code and the -# source docs do not contain the code so local, offline sphinx builds are -# "clean." -templates_path = [] -if os.getenv('HUDSON_PUBLISH_DOCS'): - templates_path = ['_ga', '_templates'] -else: - templates_path = ['_templates'] +# templates_path = [] # The suffix of source filenames. source_suffix = '.rst' # The encoding of source files. -#source_encoding = 'utf-8' +# source_encoding = 'utf-8' # The master toctree document. master_doc = 'index' # General information about the project. -project = u'Swift' -copyright = u'2011-present, OpenStack, LLC' - -# The version info for the project you're documenting, acts as replacement for -# |version| and |release|, also used in various other places throughout the -# built documents. -# -# The short X.Y version. -from swift import __version__ -version = __version__.rsplit('.', 1)[0] -# The full version, including alpha/beta/rc tags. -release = __version__ +project = 'Swift' +if 'SOURCE_DATE_EPOCH' in os.environ: + now = float(os.environ.get('SOURCE_DATE_EPOCH')) + now = datetime.datetime.fromtimestamp(now, tz=datetime.timezone.utc) +else: + now = datetime.date.today() +copyright = '%d, OpenStack Foundation' % now.year # The language for content autogenerated by Sphinx. Refer to documentation # for a list of supported languages. -#language = None +# language = None # There are two options for replacing |today|: either, you set today to some # non-false value, then it is used: -#today = '' +# today = '' # Else, today_fmt is used as the format for a strftime call. -#today_fmt = '%B %d, %Y' +# today_fmt = '%B %d, %Y' # List of documents that shouldn't be included in the build. -#unused_docs = [] +# unused_docs = [] # List of directories, relative to source directory, that shouldn't be searched # for source files. @@ -83,21 +98,21 @@ # The reST default role (used for this markup: `text`) to use for all # documents. -#default_role = None +# default_role = None # If true, '()' will be appended to :func: etc. cross-reference text. 
-#add_function_parentheses = True +# add_function_parentheses = True # If true, the current module name will be prepended to all description # unit titles (such as .. function::). -#add_module_names = True +# add_module_names = True # If true, sectionauthor and moduleauthor directives will be shown in the # output. They are ignored by default. show_authors = True # The name of the Pygments (syntax highlighting) style to use. -pygments_style = 'sphinx' +pygments_style = 'native' # A list of ignored prefixes for module index sorting. modindex_common_prefix = ['swift.'] @@ -108,74 +123,75 @@ # The theme to use for HTML and HTML Help pages. Major themes that come with # Sphinx are currently 'default' and 'sphinxdoc'. # html_theme = 'default' -html_theme_path = ["."] -html_theme = '_theme' +# html_theme_path = ["."] +html_theme = 'openstackdocs' # Theme options are theme-specific and customize the look and feel of a theme # further. For a list of options available for each theme, see the # documentation. -#html_theme_options = {} +html_theme_options = { + # turn off the "these docs aren't current" banner + 'display_badge': False, +} # Add any paths that contain custom themes here, relative to this directory. -#html_theme_path = [] +# html_theme_path = [] # The name for this set of Sphinx documents. If None, it defaults to # " v documentation". -#html_title = None +# html_title = None # A shorter title for the navigation bar. Default is the same as html_title. -#html_short_title = None +# html_short_title = None # The name of an image file (relative to this directory) to place at the top # of the sidebar. -#html_logo = None +# html_logo = None # The name of an image file (within the static path) to use as favicon of the # docs. This file should be a Windows icon file (.ico) being 16x16 or 32x32 # pixels large. -#html_favicon = None +# html_favicon = None # Add any paths that contain custom static files (such as style sheets) here, # relative to this directory. They are copied after the builtin static files, # so a file named "default.css" will overwrite the builtin "default.css". -html_static_path = ['_static'] +# html_static_path = ['_static'] -# If not '', a 'Last updated on:' timestamp is inserted at every page bottom, -# using the given strftime format. -#html_last_updated_fmt = '%b %d, %Y' -git_cmd = "git log --pretty=format:'%ad, commit %h' --date=local -n1" -html_last_updated_fmt = os.popen(git_cmd).read() +# Add any paths that contain "extra" files, such as .htaccess or +# robots.txt. +html_extra_path = ['_extra'] # If true, SmartyPants will be used to convert quotes and dashes to # typographically correct entities. -#html_use_smartypants = True +# html_use_smartypants = True # Custom sidebar templates, maps document names to template names. -#html_sidebars = {} +# html_sidebars = {} # Additional templates that should be rendered to pages, maps page names to # template names. -#html_additional_pages = {} +# html_additional_pages = {} # If false, no module index is generated. -#html_use_modindex = True +# html_use_modindex = True # If false, no index is generated. -#html_use_index = True +# html_use_index = True # If true, the index is split into individual pages for each letter. -#html_split_index = False +# html_split_index = False # If true, links to the reST sources are added to the pages. -#html_show_sourcelink = True +# html_show_sourcelink = True # If true, an OpenSearch description file will be output, and all pages will # contain a tag referring to it. 
The value of this option must be the # base URL from which the finished HTML is served. -#html_use_opensearch = '' +# html_use_opensearch = '' # If nonempty, this is the file name suffix for HTML files (e.g. ".xhtml"). -#html_file_suffix = '' +# html_file_suffix = '' # Output file base name for HTML help builder. htmlhelp_basename = 'swiftdoc' @@ -184,37 +200,41 @@ # -- Options for LaTeX output ------------------------------------------------- # The paper size ('letter' or 'a4'). -#latex_paper_size = 'letter' +# latex_paper_size = 'letter' # The font size ('10pt', '11pt' or '12pt'). -#latex_font_size = '10pt' +# latex_font_size = '10pt' # Grouping the document tree into LaTeX files. List of tuples # (source start file, target name, title, author, documentclass # [howto/manual]). latex_documents = [ - ('index', 'Swift.tex', u'Swift Documentation', - u'Swift Team', 'manual'), + ('index', 'doc-swift.tex', 'Swift Documentation', + 'Swift Team', 'manual'), ] # The name of an image file (relative to this directory) to place at the top of # the title page. -#latex_logo = None +# latex_logo = None # For "manual" documents, if this is true, then toplevel headings are parts, # not chapters. -#latex_use_parts = False +# latex_use_parts = False # Additional stuff for the LaTeX preamble. -#latex_preamble = '' +# latex_preamble = '' # Documents to append as an appendix to all manuals. -#latex_appendices = [] +# latex_appendices = [] # If false, no module index is generated. -#latex_use_modindex = True +# latex_use_modindex = True + +latex_use_xindy = False -# Example configuration for intersphinx: refer to the Python standard library. -intersphinx_mapping = {'python': ('http://docs.python.org/', None), - 'nova': ('http://nova.openstack.org', None), - 'glance': ('http://glance.openstack.org', None)} +# -- Options for openstackdocstheme ------------------------------------------- +openstackdocs_repo_name = 'openstack/swift' +openstackdocs_pdf_link = True +openstackdocs_auto_name = False +openstackdocs_bug_project = 'swift' +openstackdocs_bug_tag = '' diff --git a/doc/source/config/account_server_config.rst b/doc/source/config/account_server_config.rst new file mode 100644 index 0000000000..f305c021b0 --- /dev/null +++ b/doc/source/config/account_server_config.rst @@ -0,0 +1,377 @@ +.. _account-server-config: + +---------------------------- +Account Server Configuration +---------------------------- + +This document describes the configuration options available for the account +server. Documentation for other swift configuration options can be found at +:doc:`index`. + +An example Account Server configuration can be found at +etc/account-server.conf-sample in the source code repository. + +The following configuration sections are available: + +* :ref:`[DEFAULT] ` +* `[account-server]`_ +* `[account-replicator]`_ +* `[account-auditor]`_ +* `[account-reaper]`_ + +.. 
_account_server_default_options: + +********* +[DEFAULT] +********* + +=============================== ========== ============================================= +Option Default Description +------------------------------- ---------- --------------------------------------------- +swift_dir /etc/swift Swift configuration directory +devices /srv/node Parent directory or where devices are mounted +mount_check true Whether or not check if the devices are + mounted to prevent accidentally writing + to the root device +bind_ip 0.0.0.0 IP Address for server to bind to +bind_port 6202 Port for server to bind to +keep_idle 600 Value to set for socket TCP_KEEPIDLE +bind_timeout 30 Seconds to attempt bind before giving up +backlog 4096 Maximum number of allowed pending + connections +workers auto Override the number of pre-forked workers + that will accept connections. If set it + should be an integer, zero means no fork. If + unset, it will try to default to the number + of effective cpu cores and fallback to one. + Increasing the number of workers may reduce + the possibility of slow file system + operations in one request from negatively + impacting other requests. See + :ref:`general-service-tuning`. +max_clients 1024 Maximum number of clients one worker can + process simultaneously (it will actually + accept(2) N + 1). Setting this to one (1) + will only handle one request at a time, + without accepting another request + concurrently. +user swift User to run as +db_preallocation off If you don't mind the extra disk space usage in + overhead, you can turn this on to preallocate + disk space with SQLite databases to decrease + fragmentation. +disable_fallocate false Disable "fast fail" fallocate checks if the + underlying filesystem does not support it. +log_name swift Label used when logging +log_facility LOG_LOCAL0 Syslog log facility +log_level INFO Logging level +log_address /dev/log Logging directory +log_max_line_length 0 Caps the length of log lines to the + value given; no limit if set to 0, the + default. +log_custom_handlers None Comma-separated list of functions to call + to setup custom log handlers. +log_udp_host Override log_address +log_udp_port 514 UDP log port +log_statsd_host None Enables StatsD logging; IPv4/IPv6 + address or a hostname. If a + hostname resolves to an IPv4 and IPv6 + address, the IPv4 address will be + used. +log_statsd_port 8125 +log_statsd_default_sample_rate 1.0 +log_statsd_sample_rate_factor 1.0 +log_statsd_metric_prefix +eventlet_debug false If true, turn on debug logging for eventlet +fallocate_reserve 1% You can set fallocate_reserve to the + number of bytes or percentage of disk + space you'd like fallocate to reserve, + whether there is space for the given + file size or not. Percentage will be used + if the value ends with a '%'. This is + useful for systems that behave badly when + they completely run out of space; you can + make the services pretend they're out of + space early. +nice_priority None Scheduling priority of server processes. + Niceness values range from -20 (most + favorable to the process) to 19 (least + favorable to the process). The default + does not modify priority. +ionice_class None I/O scheduling class of server processes. + I/O niceness class values are IOPRIO_CLASS_RT + (realtime), IOPRIO_CLASS_BE (best-effort), + and IOPRIO_CLASS_IDLE (idle). + The default does not modify class and + priority. Linux supports io scheduling + priorities and classes since 2.6.13 with + the CFQ io scheduler. + Work only with ionice_priority. 
+ionice_priority None I/O scheduling priority of server processes. + I/O niceness priority is a number which + goes from 0 to 7. The higher the value, + the lower the I/O priority of the process. + Work only with ionice_class. + Ignored if IOPRIO_CLASS_IDLE is set. +=============================== ========== ============================================= + +**************** +[account-server] +**************** + +============================= ============== ========================================== +Option Default Description +----------------------------- -------------- ------------------------------------------ +use Entry point for paste.deploy for the account + server. For most cases, this should be + ``egg:swift#account``. +set log_name account-server Label used when logging +set log_facility LOG_LOCAL0 Syslog log facility +set log_level INFO Logging level +set log_requests True Whether or not to log each + request +set log_address /dev/log Logging directory +replication_server Configure parameter for creating + specific server. To handle all verbs, + including replication verbs, do not + specify "replication_server" + (this is the default). To only + handle replication, set to a True + value (e.g. "True" or "1"). + To handle only non-replication + verbs, set to "False". Unless you + have a separate replication network, you + should not specify any value for + "replication_server". +nice_priority None Scheduling priority of server processes. + Niceness values range from -20 (most + favorable to the process) to 19 (least + favorable to the process). The default + does not modify priority. +ionice_class None I/O scheduling class of server processes. + I/O niceness class values are IOPRIO_CLASS_RT + (realtime), IOPRIO_CLASS_BE (best-effort), + and IOPRIO_CLASS_IDLE (idle). + The default does not modify class and + priority. Linux supports io scheduling + priorities and classes since 2.6.13 with + the CFQ io scheduler. + Work only with ionice_priority. +ionice_priority None I/O scheduling priority of server + processes. I/O niceness priority is + a number which goes from 0 to 7. + The higher the value, the lower the I/O + priority of the process. Work only with + ionice_class. + Ignored if IOPRIO_CLASS_IDLE is set. +============================= ============== ========================================== + +******************** +[account-replicator] +******************** + +==================== ========================= ===================================== +Option Default Description +-------------------- ------------------------- ------------------------------------- +log_name account-replicator Label used when logging +log_facility LOG_LOCAL0 Syslog log facility +log_level INFO Logging level +log_address /dev/log Logging directory +per_diff 1000 Maximum number of database rows + that will be sync'd in a single + HTTP replication request. + Databases with less than or + equal to this number of + differing rows will always be + sync'd using an HTTP replication + request rather than using rsync. +max_diffs 100 Maximum number of HTTP + replication requests attempted + on each replication pass for any + one container. This caps how + long the replicator will spend + trying to sync a given database + per pass so the other databases + don't get starved. +concurrency 8 Number of replication workers + to spawn +interval 30 Time in seconds to wait between + replication passes +databases_per_second 50 Maximum databases to process + per second. Should be tuned + according to individual + system specs. 
0 is unlimited. +node_timeout 10 Request timeout to external + services +conn_timeout 0.5 Connection timeout to external + services +reclaim_age 604800 Time elapsed in seconds before + an account can be reclaimed +rsync_module {replication_ip}::account Format of the rsync module where + the replicator will send data. + The configuration value can + include some variables that will + be extracted from the ring. + Variables must follow the format + {NAME} where NAME is one of: ip, + port, replication_ip, + replication_port, region, zone, + device, meta. See + etc/rsyncd.conf-sample for some + examples. +rsync_compress no Allow rsync to compress data + which is transmitted to + destination node during sync. + However, this is applicable only + when destination node is in a + different region than the local + one. NOTE: Objects that are + already compressed (for example: + .tar.gz, mp3) might slow down + the syncing process. +recon_cache_path /var/cache/swift Path to recon cache +nice_priority None Scheduling priority of server + processes. Niceness values + range from -20 (most favorable + to the process) to 19 (least + favorable to the process). + The default does not modify + priority. +ionice_class None I/O scheduling class of server + processes. I/O niceness class + values are IOPRIO_CLASS_RT + (realtime), IOPRIO_CLASS_BE + (best-effort), and IOPRIO_CLASS_IDLE + (idle). + The default does not modify + class and priority. Linux supports + io scheduling priorities and classes + since 2.6.13 with the CFQ io scheduler. + Work only with ionice_priority. +ionice_priority None I/O scheduling priority of server + processes. I/O niceness priority + is a number which goes from 0 to 7. + The higher the value, the lower + the I/O priority of the process. + Work only with ionice_class. + Ignored if IOPRIO_CLASS_IDLE + is set. +handoffs_only no When handoffs_only mode is enabled + the replicator will *only* replicate + from handoff nodes to primary nodes + and will not sync primary nodes + with other primary nodes. +handoff_delete auto the number of replicas which are + ensured in swift. If the number + less than the number of replicas + is set, account-replicator + could delete local handoffs even + if all replicas are not ensured in + the cluster. The replicator would + remove local handoff account database + after syncing when the number of + successful responses is greater than + or equal to this number. By default + handoff partitions will be removed + when it has successfully replicated + to all the canonical nodes. +==================== ========================= ===================================== + +***************** +[account-auditor] +***************** + +==================== ================ ======================================= +Option Default Description +-------------------- ---------------- --------------------------------------- +log_name account-auditor Label used when logging +log_facility LOG_LOCAL0 Syslog log facility +log_level INFO Logging level +log_address /dev/log Logging directory +interval 1800 Minimum time for a pass to take +accounts_per_second 200 Maximum accounts audited per second. + Should be tuned according to individual + system specs. 0 is unlimited. +recon_cache_path /var/cache/swift Path to recon cache +nice_priority None Scheduling priority of server processes. + Niceness values range from -20 (most + favorable to the process) to 19 (least + favorable to the process). The default + does not modify priority. 
+ionice_class None I/O scheduling class of server processes. + I/O niceness class values are + IOPRIO_CLASS_RT (realtime), + IOPRIO_CLASS_BE (best-effort), + and IOPRIO_CLASS_IDLE (idle). + The default does not modify class and + priority. Linux supports io scheduling + priorities and classes since 2.6.13 with + the CFQ io scheduler. + Work only with ionice_priority. +ionice_priority None I/O scheduling priority of server + processes. I/O niceness priority is + a number which goes from 0 to 7. + The higher the value, the lower the I/O + priority of the process. Work only with + ionice_class. + Ignored if IOPRIO_CLASS_IDLE is set. +==================== ================ ======================================= + +**************** +[account-reaper] +**************** + +================== =============== ========================================= +Option Default Description +------------------ --------------- ----------------------------------------- +log_name account-reaper Label used when logging +log_facility LOG_LOCAL0 Syslog log facility +log_level INFO Logging level +log_address /dev/log Logging directory +concurrency 25 Number of replication workers to spawn +interval 3600 Minimum time for a pass to take +node_timeout 10 Request timeout to external services +conn_timeout 0.5 Connection timeout to external services +delay_reaping 0 Normally, the reaper begins deleting + account information for deleted accounts + immediately; you can set this to delay + its work however. The value is in seconds, + 2592000 = 30 days, for example. The sum of + this value and the container-updater + ``interval`` should be less than the + account-replicator ``reclaim_age``. This + ensures that once the account-reaper has + deleted a container there is sufficient + time for the container-updater to report + to the account before the account DB is + removed. +reap_warn_after 2892000 If the account fails to be reaped due + to a persistent error, the account reaper + will log a message such as: + Account has not been reaped since + You can search logs for this message if + space is not being reclaimed after you + delete account(s). This is in addition to + any time requested by delay_reaping. +nice_priority None Scheduling priority of server processes. + Niceness values range from -20 (most + favorable to the process) to 19 (least + favorable to the process). The default + does not modify priority. +ionice_class None I/O scheduling class of server processes. + I/O niceness class values are IOPRIO_CLASS_RT + (realtime), IOPRIO_CLASS_BE (best-effort), + and IOPRIO_CLASS_IDLE (idle). + The default does not modify class and + priority. Linux supports io scheduling + priorities and classes since 2.6.13 with + the CFQ io scheduler. + Work only with ionice_priority. +ionice_priority None I/O scheduling priority of server + processes. I/O niceness priority is + a number which goes from 0 to 7. + The higher the value, the lower the I/O + priority of the process. Work only with + ionice_class. + Ignored if IOPRIO_CLASS_IDLE is set. +================== =============== ========================================= diff --git a/doc/source/config/container_server_config.rst b/doc/source/config/container_server_config.rst new file mode 100644 index 0000000000..6f7d6031a3 --- /dev/null +++ b/doc/source/config/container_server_config.rst @@ -0,0 +1,650 @@ +.. 
_container-server-config: + +------------------------------ +Container Server Configuration +------------------------------ + +This document describes the configuration options available for the container +server. Documentation for other swift configuration options can be found at +:doc:`index`. + +An example Container Server configuration can be found at +etc/container-server.conf-sample in the source code repository. + +The following configuration sections are available: + +* :ref:`[DEFAULT] ` +* `[container-server]`_ +* `[container-replicator]`_ +* `[container-sharder]`_ +* `[container-updater]`_ +* `[container-auditor]`_ + +.. _container_server_default_options: + +********* +[DEFAULT] +********* + +=============================== ========== ============================================ +Option Default Description +------------------------------- ---------- -------------------------------------------- +swift_dir /etc/swift Swift configuration directory +devices /srv/node Parent directory of where devices are mounted +mount_check true Whether or not check if the devices are + mounted to prevent accidentally writing + to the root device +bind_ip 0.0.0.0 IP Address for server to bind to +bind_port 6201 Port for server to bind to +keep_idle 600 Value to set for socket TCP_KEEPIDLE +bind_timeout 30 Seconds to attempt bind before giving up +backlog 4096 Maximum number of allowed pending + connections +workers auto Override the number of pre-forked workers + that will accept connections. If set it + should be an integer, zero means no fork. If + unset, it will try to default to the number + of effective cpu cores and fallback to one. + Increasing the number of workers may reduce + the possibility of slow file system + operations in one request from negatively + impacting other requests. See + :ref:`general-service-tuning`. +max_clients 1024 Maximum number of clients one worker can + process simultaneously (it will actually + accept(2) N + 1). Setting this to one (1) + will only handle one request at a time, + without accepting another request + concurrently. +user swift User to run as +disable_fallocate false Disable "fast fail" fallocate checks if the + underlying filesystem does not support it. +log_name swift Label used when logging +log_facility LOG_LOCAL0 Syslog log facility +log_level INFO Logging level +log_address /dev/log Logging directory +log_max_line_length 0 Caps the length of log lines to the + value given; no limit if set to 0, the + default. +log_custom_handlers None Comma-separated list of functions to call + to setup custom log handlers. +log_udp_host Override log_address +log_udp_port 514 UDP log port +log_statsd_host None Enables StatsD logging; IPv4/IPv6 + address or a hostname. If a + hostname resolves to an IPv4 and IPv6 + address, the IPv4 address will be + used. +log_statsd_port 8125 +log_statsd_default_sample_rate 1.0 +log_statsd_sample_rate_factor 1.0 +log_statsd_metric_prefix +eventlet_debug false If true, turn on debug logging for eventlet +fallocate_reserve 1% You can set fallocate_reserve to the + number of bytes or percentage of disk + space you'd like fallocate to reserve, + whether there is space for the given + file size or not. Percentage will be used + if the value ends with a '%'. This is + useful for systems that behave badly when + they completely run out of space; you can + make the services pretend they're out of + space early. 
+db_preallocation off If you don't mind the extra disk space usage + in overhead, you can turn this on to preallocate + disk space with SQLite databases to decrease + fragmentation. +nice_priority None Scheduling priority of server processes. + Niceness values range from -20 (most + favorable to the process) to 19 (least + favorable to the process). The default + does not modify priority. +ionice_class None I/O scheduling class of server processes. + I/O niceness class values are IOPRIO_CLASS_RT + (realtime), IOPRIO_CLASS_BE (best-effort), + and IOPRIO_CLASS_IDLE (idle). + The default does not modify class and + priority. Linux supports io scheduling + priorities and classes since 2.6.13 + with the CFQ io scheduler. + Work only with ionice_priority. +ionice_priority None I/O scheduling priority of server processes. + I/O niceness priority is a number which + goes from 0 to 7. The higher the value, + the lower the I/O priority of the process. + Work only with ionice_class. + Ignored if IOPRIO_CLASS_IDLE is set. +=============================== ========== ============================================ + +****************** +[container-server] +****************** + +============================== ================ ======================================== +Option Default Description +------------------------------ ---------------- ---------------------------------------- +use paste.deploy entry point for the + container server. For most cases, this + should be ``egg:swift#container``. +set log_name container-server Label used when logging +set log_facility LOG_LOCAL0 Syslog log facility +set log_level INFO Logging level +set log_requests True Whether or not to log each + request +set log_address /dev/log Logging directory +node_timeout 3 Request timeout to external services +conn_timeout 0.5 Connection timeout to external services +allow_versions false Enable/Disable object versioning feature +replication_server Configure parameter for creating + specific server. To handle all verbs, + including replication verbs, do not + specify "replication_server" + (this is the default). To only + handle replication, set to a True + value (e.g. "True" or "1"). + To handle only non-replication + verbs, set to "False". Unless you + have a separate replication network, you + should not specify any value for + "replication_server". +nice_priority None Scheduling priority of server processes. + Niceness values range from -20 (most + favorable to the process) to 19 (least + favorable to the process). The default + does not modify priority. +ionice_class None I/O scheduling class of server processes. + I/O niceness class values are + IOPRIO_CLASS_RT (realtime), + IOPRIO_CLASS_BE (best-effort), + and IOPRIO_CLASS_IDLE (idle). + The default does not modify class and + priority. Linux supports io scheduling + priorities and classes since 2.6.13 with + the CFQ io scheduler. + Work only with ionice_priority. +ionice_priority None I/O scheduling priority of server + processes. I/O niceness priority is + a number which goes from 0 to 7. + The higher the value, the lower the I/O + priority of the process. Work only with + ionice_class. + Ignored if IOPRIO_CLASS_IDLE is set. 
+============================== ================ ======================================== + +********************** +[container-replicator] +********************** + +==================== =========================== ======================================= +Option Default Description +-------------------- --------------------------- --------------------------------------- +log_name container-replicator Label used when logging +log_facility LOG_LOCAL0 Syslog log facility +log_level INFO Logging level +log_address /dev/log Logging directory +per_diff 1000 Maximum number of database + rows that will be sync'd in a + single HTTP replication + request. Databases with less + than or equal to this number + of differing rows will always + be sync'd using an HTTP + replication request rather + than using rsync. +max_diffs 100 Maximum number of HTTP + replication requests attempted + on each replication pass for + any one container. This caps + how long the replicator will + spend trying to sync a given + database per pass so the other + databases don't get starved. +concurrency 8 Number of replication workers + to spawn +interval 30 Time in seconds to wait + between replication passes +databases_per_second 50 Maximum databases to process + per second. Should be tuned + according to individual + system specs. 0 is unlimited. +node_timeout 10 Request timeout to external + services +conn_timeout 0.5 Connection timeout to external + services +reclaim_age 604800 Time elapsed in seconds before + a container can be reclaimed +rsync_module {replication_ip}::container Format of the rsync module + where the replicator will send + data. The configuration value + can include some variables + that will be extracted from + the ring. Variables must + follow the format {NAME} where + NAME is one of: ip, port, + replication_ip, + replication_port, region, + zone, device, meta. See + etc/rsyncd.conf-sample for + some examples. +rsync_compress no Allow rsync to compress data + which is transmitted to + destination node during sync. + However, this is applicable + only when destination node is + in a different region than the + local one. NOTE: Objects that + are already compressed (for + example: .tar.gz, mp3) might + slow down the syncing process. +recon_cache_path /var/cache/swift Path to recon cache +nice_priority None Scheduling priority of server + processes. Niceness values + range from -20 (most favorable + to the process) to 19 (least + favorable to the process). + The default does not modify + priority. +ionice_class None I/O scheduling class of server + processes. I/O niceness class + values are + IOPRIO_CLASS_RT (realtime), + IOPRIO_CLASS_BE (best-effort), + and IOPRIO_CLASS_IDLE (idle). + The default does not modify + class and priority. Linux + supports io scheduling + priorities and classes since + 2.6.13 with the CFQ io + scheduler. + Work only with ionice_priority. +ionice_priority None I/O scheduling priority of + server processes. I/O niceness + priority is a number which goes + from 0 to 7. + The higher the value, the lower + the I/O priority of the process. + Work only with ionice_class. + Ignored if IOPRIO_CLASS_IDLE + is set. +handoffs_only no When handoffs_only mode is enabled + the replicator will *only* replicate + from handoff nodes to primary nodes + and will not sync primary nodes + with other primary nodes. +handoff_delete auto the number of replicas which are + ensured in swift. 
If the number + less than the number of replicas + is set, container-replicator + could delete local handoffs even + if all replicas are not ensured in + the cluster. The replicator would + remove local handoff container database + after syncing when the number of + successful responses is greater than + or equal to this number. By default + handoff partitions will be removed + when it has successfully replicated + to all the canonical nodes. +==================== =========================== ======================================= + +******************* +[container-sharder] +******************* + +The container-sharder re-uses features of the container-replicator and inherits +the following configuration options defined for the `[container-replicator]`_: + +* interval +* databases_per_second +* per_diff +* max_diffs +* concurrency +* node_timeout +* conn_timeout +* reclaim_age +* rsync_compress +* rsync_module +* recon_cache_path + +Some config options in this section may also be used by the +:ref:`swift-manage-shard-ranges CLI tool `. + +================================= ================= ======================================= +Option Default Description +--------------------------------- ----------------- --------------------------------------- +log_name container-sharder Label used when logging +log_facility LOG_LOCAL0 Syslog log facility +log_level INFO Logging level +log_address /dev/log Logging directory + + +auto_shard false If the auto_shard option + is true then the sharder + will automatically select + containers to shard, scan + for shard ranges, and + select shards to shrink. + Warning: auto-sharding is + still under development + and should not be used in + production; do not set + this option to true in a + production cluster. + +shard_container_threshold 1000000 This defines the + object count at which a + container with + container-sharding + enabled will start to + shard. This also + indirectly determines the + the defaults for + rows_per_shard, + shrink_threshold and + expansion_limit. + +rows_per_shard 500000 This defines the initial + nominal size of shard + containers. The default + is shard_container_threshold // 2. + +minimum_shard_size 100000 Minimum size of the final + shard range. If this is + greater than one then the + final shard range may be + extended to more than + rows_per_shard in order + to avoid a further shard + range with less than + minimum_shard_size rows. + The default value is + rows_per_shard // 5. + +shrink_threshold This defines the + object count below which + a 'donor' shard container + will be considered for + shrinking into another + 'acceptor' shard + container. The default is + determined by + shard_shrink_point. If + set, shrink_threshold + will take precedence over + shard_shrink_point. + +shard_shrink_point 10 Deprecated: shrink_threshold + is recommended and if set + will take precedence over + shard_shrink_point. + This defines the + object count below which + a 'donor' shard container + will be considered for + shrinking into another + 'acceptor' shard + container. + shard_shrink_point is a + percentage of + shard_container_threshold + e.g. the default value of + 10 means 10% of the + shard_container_threshold. + +expansion_limit This defines the + maximum allowed size of + an acceptor shard + container after having a + donor merged into it. The + default is determined by + shard_shrink_merge_point. + If set, expansion_limit + will take precedence over + shard_shrink_merge_point. 
+ +shard_shrink_merge_point 75 Deprecated: expansion_limit + is recommended and if set + will take precedence over + shard_shrink_merge_point. + This defines the + maximum allowed size of + an acceptor shard + container after having a + donor merged into it. + Shard_shrink_merge_point + is a percentage of + shard_container_threshold. + e.g. the default value of + 75 means that the + projected sum of a donor + object count and acceptor + count must be less than + 75% of shard_container_threshold + for the donor to be + allowed to merge into the + acceptor. + + For example, if + shard_container_threshold + is 1 million, + shard_shrink_point is 10, + and shard_shrink_merge_point + is 75 then a shard will + be considered for + shrinking if it has less + than or equal to 100 + thousand objects but will + only merge into an + acceptor if the combined + object count would be + less than or equal to 750 + thousand objects. + + +shard_scanner_batch_size 10 When auto-sharding is + enabled this defines the + maximum number of shard + ranges that will be found + each time the sharder + daemon visits a sharding + container. If necessary + the sharder daemon will + continue to search for + more shard ranges each + time it visits the + container. + +cleave_batch_size 2 Defines the number of + shard ranges that will be + cleaved each time the + sharder daemon visits a + sharding container. + +cleave_row_batch_size 10000 Defines the size of + batches of object rows + read from a sharding + container and merged to a + shard container during + cleaving. + +shard_replication_quorum auto Defines the number of + successfully replicated + shard dbs required when + cleaving a previously + uncleaved shard range + before the sharder will + progress to the next + shard range. The value + should be less than or + equal to the container + ring replica count. The + default of 'auto' causes + the container ring quorum + value to be used. This + option only applies to + the container-sharder + replication and does not + affect the number of + shard container replicas + that will eventually be + replicated by the + container-replicator. + + +existing_shard_replication_quorum auto Defines the number of + successfully replicated + shard dbs required when + cleaving a shard range + that has been previously + cleaved on another node + before the sharder will + progress to the next + shard range. The value + should be less than or + equal to the container + ring replica count. The + default of 'auto' causes + the shard_replication_quorum + value to be used. This + option only applies to + the container-sharder + replication and does not + affect the number of + shard container replicas + that will eventually be + replicated by the + container-replicator. + +internal_client_conf_path see description The sharder uses an + internal client to create + and make requests to + containers. The absolute + path to the client config + file can be configured. + Defaults to + /etc/swift/internal-client.conf + +request_tries 3 The number of time the + internal client will + retry requests. + +recon_candidates_limit 5 Each time the sharder + dumps stats to the recon + cache file it includes a + list of containers that + appear to need sharding + but are not yet sharding. + By default this list is + limited to the top 5 + containers, ordered by + object count. The limit + may be changed by setting + recon_candidates_limit to + an integer value. A + negative value implies no + limit. 
+ +broker_timeout 60 Large databases tend to + take a while to work + with, but we want to make + sure we write down our + progress. Use a + larger-than-normal broker + timeout to make us less + likely to bomb out on a + LockTimeout. +================================= ================= ======================================= + +******************* +[container-updater] +******************* + +======================== ================= ================================== +Option Default Description +------------------------ ----------------- ---------------------------------- +log_name container-updater Label used when logging +log_facility LOG_LOCAL0 Syslog log facility +log_level INFO Logging level +log_address /dev/log Logging directory +interval 300 Minimum time for a pass to take +concurrency 4 Number of updater workers to spawn +node_timeout 3 Request timeout to external + services +conn_timeout 0.5 Connection timeout to external + services +containers_per_second 50 Maximum containers updated per second. + Should be tuned according to individual + system specs. 0 is unlimited. + +slowdown 0.01 Time in seconds to wait between + containers. Deprecated in favor of + containers_per_second. +account_suppression_time 60 Seconds to suppress updating an + account that has generated an + error (timeout, not yet found, + etc.) +recon_cache_path /var/cache/swift Path to recon cache +nice_priority None Scheduling priority of server + processes. Niceness values range + from -20 (most favorable to the + process) to 19 (least favorable + to the process). The default does + not modify priority. +ionice_class None I/O scheduling class of server + processes. I/O niceness class + values are IOPRIO_CLASS_RT (realtime), + IOPRIO_CLASS_BE (best-effort), + and IOPRIO_CLASS_IDLE (idle). + The default does not modify class and + priority. Linux supports io scheduling + priorities and classes since 2.6.13 with + the CFQ io scheduler. + Work only with ionice_priority. +ionice_priority None I/O scheduling priority of server + processes. I/O niceness priority is + a number which goes from 0 to 7. + The higher the value, the lower + the I/O priority of the process. + Work only with ionice_class. + Ignored if IOPRIO_CLASS_IDLE is set. +======================== ================= ================================== + +******************* +[container-auditor] +******************* + +===================== ================= ======================================= +Option Default Description +--------------------- ----------------- --------------------------------------- +log_name container-auditor Label used when logging +log_facility LOG_LOCAL0 Syslog log facility +log_level INFO Logging level +log_address /dev/log Logging directory +interval 1800 Minimum time for a pass to take +containers_per_second 200 Maximum containers audited per second. + Should be tuned according to individual + system specs. 0 is unlimited. +recon_cache_path /var/cache/swift Path to recon cache +nice_priority None Scheduling priority of server processes. + Niceness values range from -20 (most + favorable to the process) to 19 (least + favorable to the process). The default + does not modify priority. +ionice_class None I/O scheduling class of server processes. + I/O niceness class values are + IOPRIO_CLASS_RT (realtime), + IOPRIO_CLASS_BE (best-effort), + and IOPRIO_CLASS_IDLE (idle). + The default does not modify class and + priority. Linux supports io scheduling + priorities and classes since 2.6.13 with + the CFQ io scheduler. 
+ Work only with ionice_priority. +ionice_priority None I/O scheduling priority of server + processes. I/O niceness priority is + a number which goes from 0 to 7. + The higher the value, the lower the I/O + priority of the process. Work only with + ionice_class. + Ignored if IOPRIO_CLASS_IDLE is set. +===================== ================= ======================================= diff --git a/doc/source/config/global_memcache_config.rst b/doc/source/config/global_memcache_config.rst new file mode 100644 index 0000000000..21ef6c43a2 --- /dev/null +++ b/doc/source/config/global_memcache_config.rst @@ -0,0 +1,73 @@ +.. _memcache-config: + +----------------------------- +Global Memcache Configuration +----------------------------- + +This document describes the configuration options available for the global swift memcache configuration +which usually lives under /etc/swift/memcache.conf. +Documentation for other swift configuration options can be found at +:doc:`index`. + +An example memcache.conf configuration can be found at +etc/memcache.conf-sample in the source code repository. + +There is only 1 configuration section available: + +* :ref:`[memcache] ` + + +.. _memcache_conf_memcache_section: + +********** +[memcache] +********** + +=========================== =============== ============================================= +Option Default Description +--------------------------- --------------- --------------------------------------------- +memcache_servers 127.0.0.1:11211 Comma separated list of memcached servers + ip:port or [ipv6addr]:port +memcache_max_connections 2 Max number of connections to each memcached + server per worker +connect_timeout 0.3 Timeout for connection +pool_timeout 1.0 Timeout for pooled connection +tries 3 Number of servers to retry on failures + getting a pooled connection +io_timeout 2.0 Timeout for read and writes +error_suppression_interval 60.0 How long without an error before a server's + error count is reset. This will also be how + long before a server is reenabled after + suppression is triggered. + Set to 0 to disable error-limiting. +error_suppression_limit 10 How many errors can accumulate before a + server is temporarily ignored +item_size_warning_threshold -1 If an item size ever gets above + item_size_warning_threshold then a warning + will be logged. This can be used to alert + when memcache item sizes are getting to + their limit. + It's an absolute size in bytes. Setting the + value to 0 will warn on every memcache set. + A value of -1 disables the warning +tls_enabled False (Optional) Global toggle for TLS usage + when comunicating with the caching servers +tls_cafile (Optional) Path to a file of concatenated + CA certificates in PEM format necessary to + establish the caching server's authenticity. + If tls_enabled is False, this option is + ignored. +tls_certfile (Optional) Path to a single file in PEM + format containing the client's certificate + as well as any number of CA certificates + needed to establish the certificate's + authenticity. This file is only required + when client side authentication is + necessary. If tls_enabled is False, + this option is ignored +tls_keyfile (Optional) Path to a single file containing + the client's private key in. Otherwhise the + private key will be taken from the file + specified in tls_certfile. 
If tls_enabled + is False, this option is ignored +=========================== =============== ============================================= \ No newline at end of file diff --git a/doc/source/config/index.rst b/doc/source/config/index.rst new file mode 100644 index 0000000000..bfec36b78a --- /dev/null +++ b/doc/source/config/index.rst @@ -0,0 +1,18 @@ +=========================== +Configuration Documentation +=========================== + +.. toctree:: + :maxdepth: 2 + + swift_common_config.rst + proxy_server_config.rst + account_server_config.rst + container_server_config.rst + object_server_config.rst + global_memcache_config.rst + +Configuration options for middleware can be found at: + +* :doc:`../middleware` +* :doc:`../overview_auth` diff --git a/doc/source/config/object_server_config.rst b/doc/source/config/object_server_config.rst new file mode 100644 index 0000000000..f85ee5df7e --- /dev/null +++ b/doc/source/config/object_server_config.rst @@ -0,0 +1,765 @@ +.. _object-server-config: + +--------------------------- +Object Server Configuration +--------------------------- + +This document describes the configuration options available for the object +server. Documentation for other swift configuration options can be found at +:doc:`index`. + +An Example Object Server configuration can be found at +etc/object-server.conf-sample in the source code repository. + +The following configuration sections are available: + +* :ref:`[DEFAULT] ` +* `[object-server]`_ +* `[object-replicator]`_ +* `[object-reconstructor]`_ +* `[object-updater]`_ +* `[object-auditor]`_ +* `[object-expirer]`_ + +.. _object-server-default-options: + +********* +[DEFAULT] +********* + +================================ ========== ============================================ +Option Default Description +-------------------------------- ---------- -------------------------------------------- +swift_dir /etc/swift Swift configuration directory +devices /srv/node Parent directory of where devices are + mounted +mount_check true Whether or not check if the devices are + mounted to prevent accidentally writing + to the root device +bind_ip 0.0.0.0 IP Address for server to bind to +bind_port 6200 Port for server to bind to +keep_idle 600 Value to set for socket TCP_KEEPIDLE +bind_timeout 30 Seconds to attempt bind before giving up +backlog 4096 Maximum number of allowed pending + connections +workers auto Override the number of pre-forked workers + that will accept connections. If set it + should be an integer, zero means no fork. + If unset, it will try to default to the + number of effective cpu cores and fallback + to one. Increasing the number of workers + helps slow filesystem operations in one + request from negatively impacting other + requests, but only the + :ref:`servers_per_port + ` option + provides complete I/O isolation with no + measurable overhead. +servers_per_port 0 If each disk in each storage policy ring + has unique port numbers for its "ip" + value, you can use this setting to have + each object-server worker only service + requests for the single disk matching the + port in the ring. The value of this + setting determines how many worker + processes run for each port (disk) in the + ring. If you have 24 disks per server, and + this setting is 4, then each storage node + will have 1 + (24 * 4) = 97 total + object-server processes running. This + gives complete I/O isolation, drastically + reducing the impact of slow disks on + storage node performance. 
The + object-replicator and object-reconstructor + need to see this setting too, so it must + be in the [DEFAULT] section. + See :ref:`server-per-port-configuration`. +max_clients 1024 Maximum number of clients one worker can + process simultaneously (it will actually + accept(2) N + 1). Setting this to one (1) + will only handle one request at a time, + without accepting another request + concurrently. +disable_fallocate false Disable "fast fail" fallocate checks if + the underlying filesystem does not support + it. +log_name swift Label used when logging +log_facility LOG_LOCAL0 Syslog log facility +log_level INFO Logging level +log_address /dev/log Logging directory +log_max_line_length 0 Caps the length of log lines to the + value given; no limit if set to 0, the + default. +log_custom_handlers None Comma-separated list of functions to call + to setup custom log handlers. +log_udp_host Override log_address +log_udp_port 514 UDP log port +log_statsd_host None Enables StatsD logging; IPv4/IPv6 + address or a hostname. If a + hostname resolves to an IPv4 and IPv6 + address, the IPv4 address will be + used. +log_statsd_port 8125 +log_statsd_default_sample_rate 1.0 +log_statsd_sample_rate_factor 1.0 +log_statsd_metric_prefix +eventlet_debug false If true, turn on debug logging for + eventlet +fallocate_reserve 1% You can set fallocate_reserve to the + number of bytes or percentage of disk + space you'd like fallocate to reserve, + whether there is space for the given + file size or not. Percentage will be used + if the value ends with a '%'. This is + useful for systems that behave badly when + they completely run out of space; you can + make the services pretend they're out of + space early. +conn_timeout 0.5 Time to wait while attempting to connect + to another backend node. +node_timeout 3 Time to wait while sending each chunk of + data to another backend node. +client_timeout 60 Time to wait while receiving each chunk of + data from a client or another backend node +network_chunk_size 65536 Size of chunks to read/write over the + network +disk_chunk_size 65536 Size of chunks to read/write to disk +container_update_timeout 1 Time to wait while sending a container + update on object update. +reclaim_age 604800 Time elapsed in seconds before the tombstone + file representing a deleted object can be + reclaimed. This is the maximum window for + your consistency engine. If a node that was + disconnected from the cluster because of a + fault is reintroduced into the cluster after + this window without having its data purged + it will result in dark data. This setting + should be consistent across all object + services. +commit_window 60 Non-durable data files may also + get reclaimed if they are older + than reclaim_age, but not if the + time they were written to disk + (i.e. mtime) is less than + commit_window seconds ago. A + commit_window greater than zero is + strongly recommended to avoid + unintended reclamation of data + files that were about to become + durable; commit_window should be + much less than reclaim_age. +nice_priority None Scheduling priority of server processes. + Niceness values range from -20 (most + favorable to the process) to 19 (least + favorable to the process). The default + does not modify priority. +ionice_class None I/O scheduling class of server processes. + I/O niceness class values are IOPRIO_CLASS_RT + (realtime), IOPRIO_CLASS_BE (best-effort), + and IOPRIO_CLASS_IDLE (idle). + The default does not modify class and + priority. 
Linux supports io scheduling + priorities and classes since 2.6.13 with + the CFQ io scheduler. + Work only with ionice_priority. +ionice_priority None I/O scheduling priority of server + processes. I/O niceness priority is + a number which goes from 0 to 7. + The higher the value, the lower the I/O + priority of the process. Work only with + ionice_class. + Ignored if IOPRIO_CLASS_IDLE is set. +================================ ========== ============================================ + +.. _object-server-options: + +*************** +[object-server] +*************** + +================================== ====================== =============================================== +Option Default Description +---------------------------------- ---------------------- ----------------------------------------------- +use paste.deploy entry point for the + object server. For most cases, + this should be + ``egg:swift#object``. +set log_name object-server Label used when logging +set log_facility LOG_LOCAL0 Syslog log facility +set log_level INFO Logging level +set log_requests True Whether or not to log each + request +set log_address /dev/log Logging directory +user swift User to run as +max_upload_time 86400 Maximum time allowed to upload an + object +slow 0 If > 0, Minimum time in seconds for a PUT or + DELETE request to complete. This is only + useful to simulate slow devices during testing + and development. +mb_per_sync 512 On PUT requests, sync file every + n MB +keep_cache_size 5242880 Largest object size to keep in + buffer cache +keep_cache_private false Allow non-public objects to stay + in kernel's buffer cache +keep_cache_slo_manifest false Allow SLO object's manifest file to stay in + kernel's buffer cache if its size is under + keep_cache_size. This config will only matter + when 'keep_cache_private' is false. +allowed_headers Content-Disposition, Comma separated list of headers + Content-Encoding, that can be set in metadata on an object. + X-Delete-At, This list is in addition to + X-Object-Manifest, X-Object-Meta-* headers and cannot include + X-Static-Large-Object Content-Type, etag, Content-Length, or deleted + Cache-Control, + Content-Language, + Expires, + X-Robots-Tag +replication_server Configure parameter for creating + specific server. To handle all verbs, + including replication verbs, do not + specify "replication_server" + (this is the default). To only + handle replication, set to a True + value (e.g. "True" or "1"). + To handle only non-replication + verbs, set to "False". Unless you + have a separate replication network, you + should not specify any value for + "replication_server". +replication_concurrency 4 Set to restrict the number of + concurrent incoming SSYNC + requests; set to 0 for unlimited +replication_concurrency_per_device 1 Set to restrict the number of + concurrent incoming SSYNC + requests per device; set to 0 for + unlimited requests per devices. + This can help control I/O to each + device. This does not override + replication_concurrency described + above, so you may need to adjust + both parameters depending on your + hardware or network capacity. +replication_lock_timeout 15 Number of seconds to wait for an + existing replication device lock + before giving up. 
+replication_failure_threshold 100 The number of subrequest failures + before the + replication_failure_ratio is + checked +replication_failure_ratio 1.0 If the value of failures / + successes of SSYNC + subrequests exceeds this ratio, + the overall SSYNC request + will be aborted +splice no Use splice() for zero-copy object + GETs. This requires Linux kernel + version 3.0 or greater. If you set + "splice = yes" but the kernel + does not support it, error messages + will appear in the object server + logs at startup, but your object + servers should continue to function. +nice_priority None Scheduling priority of server processes. + Niceness values range from -20 (most + favorable to the process) to 19 (least + favorable to the process). The default + does not modify priority. +ionice_class None I/O scheduling class of server processes. + I/O niceness class values are IOPRIO_CLASS_RT + (realtime), IOPRIO_CLASS_BE (best-effort), + and IOPRIO_CLASS_IDLE (idle). + The default does not modify class and + priority. Linux supports io scheduling + priorities and classes since 2.6.13 with + the CFQ io scheduler. + Work only with ionice_priority. +ionice_priority None I/O scheduling priority of server + processes. I/O niceness priority is + a number which goes from 0 to 7. + The higher the value, the lower the I/O + priority of the process. Work only with + ionice_class. + Ignored if IOPRIO_CLASS_IDLE is set. +eventlet_tpool_num_threads auto The number of threads in eventlet's thread pool. + Most IO will occur in the object server's main + thread, but certain "heavy" IO operations will + occur in separate IO threads, managed by + eventlet. + The default value is auto, whose actual value + is dependent on the servers_per_port value. + If servers_per_port is zero then it uses + eventlet's default (currently 20 threads). + If the servers_per_port is nonzero then it'll + only use 1 thread per process. + This value can be overridden with an integer + value. +================================== ====================== =============================================== + +******************* +[object-replicator] +******************* + +=========================== ======================== ================================ +Option Default Description +--------------------------- ------------------------ -------------------------------- +log_name object-replicator Label used when logging +log_facility LOG_LOCAL0 Syslog log facility +log_level INFO Logging level +log_address /dev/log Logging directory +daemonize yes Whether or not to run replication + as a daemon +interval 30 Time in seconds to wait between + replication passes +concurrency 1 Number of replication jobs to + run per worker process +replicator_workers 0 Number of worker processes to use. + No matter how big this number is, + at most one worker per disk will + be used. The default value of 0 + means no forking; all work is done + in the main process. +sync_method rsync The sync method to use; default + is rsync but you can use ssync to + try the EXPERIMENTAL + all-swift-code-no-rsync-callouts + method. Once ssync is verified as + or better than, rsync, we plan to + deprecate rsync so we can move on + with more features for + replication. +rsync_timeout 900 Max duration of a partition rsync +rsync_bwlimit 0 Bandwidth limit for rsync in kB/s. + 0 means unlimited. +rsync_io_timeout 30 Timeout value sent to rsync + --timeout and --contimeout + options +rsync_compress no Allow rsync to compress data + which is transmitted to destination + node during sync. 
However, this + is applicable only when destination + node is in a different region + than the local one. + NOTE: Objects that are already + compressed (for example: .tar.gz, + .mp3) might slow down the syncing + process. +stats_interval 300 Interval in seconds between + logging replication statistics +handoffs_first false If set to True, partitions that + are not supposed to be on the + node will be replicated first. + The default setting should not be + changed, except for extreme + situations. +handoff_delete auto By default handoff partitions + will be removed when it has + successfully replicated to all + the canonical nodes. If set to an + integer n, it will remove the + partition if it is successfully + replicated to n nodes. The + default setting should not be + changed, except for extreme + situations. +node_timeout DEFAULT or 10 Request timeout to external + services. This uses what's set + here, or what's set in the + DEFAULT section, or 10 (though + other sections use 3 as the final + default). +http_timeout 60 Max duration of an http request. + This is for REPLICATE finalization + calls and so should be longer + than node_timeout. +lockup_timeout 1800 Attempts to kill all workers if + nothing replicates for + lockup_timeout seconds +rsync_module {replication_ip}::object Format of the rsync module where + the replicator will send data. + The configuration value can + include some variables that will + be extracted from the ring. + Variables must follow the format + {NAME} where NAME is one of: ip, + port, replication_ip, + replication_port, region, zone, + device, meta. See + etc/rsyncd.conf-sample for some + examples. +rsync_error_log_line_length 0 Limits how long rsync error log + lines are +ring_check_interval 15 Interval for checking new ring + file +recon_cache_path /var/cache/swift Path to recon cache +nice_priority None Scheduling priority of server + processes. Niceness values + range from -20 (most favorable + to the process) to 19 (least + favorable to the process). + The default does not modify + priority. +ionice_class None I/O scheduling class of server + processes. I/O niceness class + values are IOPRIO_CLASS_RT (realtime), + IOPRIO_CLASS_BE (best-effort), + and IOPRIO_CLASS_IDLE (idle). + The default does not modify + class and priority. + Linux supports io scheduling + priorities and classes since + 2.6.13 with the CFQ io scheduler. + Work only with ionice_priority. +ionice_priority None I/O scheduling priority of server + processes. I/O niceness priority + is a number which goes from + 0 to 7. The higher the value, + the lower the I/O priority of + the process. + Work only with ionice_class. + Ignored if IOPRIO_CLASS_IDLE + is set. +=========================== ======================== ================================ + +********************** +[object-reconstructor] +********************** + +=========================== ======================== ================================ +Option Default Description +--------------------------- ------------------------ -------------------------------- +log_name object-reconstructor Label used when logging +log_facility LOG_LOCAL0 Syslog log facility +log_level INFO Logging level +log_address /dev/log Logging directory +daemonize yes Whether or not to run + reconstruction as a daemon +interval 30 Time in seconds to wait between + reconstruction passes +reconstructor_workers 0 Maximum number of worker processes + to spawn. Each worker will handle + a subset of devices. 
Devices will + be assigned evenly among the workers + so that workers cycle at similar + intervals (which can lead to fewer + workers than requested). You can not + have more workers than devices. If + you have no devices only a single + worker is spawned. +concurrency 1 Number of reconstruction threads to + spawn per reconstructor process. +stats_interval 300 Interval in seconds between + logging reconstruction statistics +handoffs_only false The handoffs_only mode option is for + special case emergency situations + during rebalance such as disk full in + the cluster. This option SHOULD NOT + BE CHANGED, except for extreme + situations. When handoffs_only mode + is enabled the reconstructor will + *only* revert fragments from handoff + nodes to primary nodes and will not + sync primary nodes with neighboring + primary nodes. This will force the + reconstructor to sync and delete + handoffs' fragments more quickly and + minimize the time of the rebalance by + limiting the number of rebuilds. The + handoffs_only option is only for + temporary use and should be disabled + as soon as the emergency situation + has been resolved. +rebuild_handoff_node_count 2 The default strategy for unmounted + drives will stage + rebuilt data on a + handoff node until + updated rings are + deployed. Because + fragments are rebuilt on + offset handoffs based on + fragment index and the + proxy limits how deep it + will search for EC frags + we restrict how many + nodes we'll try. + Setting to 0 will + disable rebuilds to + handoffs and only + rebuild fragments for + unmounted devices to + mounted primaries after + a ring change. Setting + to -1 means "no limit". +max_objects_per_revert 0 By default the reconstructor + attempts to revert all + objects from handoff + partitions in a single + batch using a single + SSYNC request. In + exceptional + circumstances + max_objects_per_revert + can be used to + temporarily limit the + number of objects + reverted by each + reconstructor revert + type job. If more than + max_objects_per_revert + are available in a + sender's handoff + partition, the remaining + objects will remain in + the handoff partition + and will not be reverted + until the next time the + reconstructor visits + that handoff partition + i.e. with this option + set, a single cycle of + the reconstructor may + not completely revert + all handoff partitions. + The option has no effect + on reconstructor sync + type jobs between + primary partitions. A + value of 0 (the default) + means there is no limit. +node_timeout DEFAULT or 10 Request timeout to external + services. The value used is the value + set in this section, or the value set + in the DEFAULT section, or 10. +http_timeout 60 Max duration of an http request. + This is for REPLICATE finalization + calls and so should be longer + than node_timeout. +lockup_timeout 1800 Attempts to kill all threads if + no fragment has been reconstructed + for lockup_timeout seconds. +ring_check_interval 15 Interval for checking new ring + file +recon_cache_path /var/cache/swift Path to recon cache +nice_priority None Scheduling priority of server + processes. Niceness values + range from -20 (most favorable + to the process) to 19 (least + favorable to the process). + The default does not modify + priority. +ionice_class None I/O scheduling class of server + processes. I/O niceness class + values are IOPRIO_CLASS_RT (realtime), + IOPRIO_CLASS_BE (best-effort), + and IOPRIO_CLASS_IDLE (idle). + The default does not modify + class and priority. 
+ Linux supports io scheduling + priorities and classes since + 2.6.13 with the CFQ io scheduler. + Work only with ionice_priority. +ionice_priority None I/O scheduling priority of server + processes. I/O niceness priority + is a number which goes from + 0 to 7. The higher the value, + the lower the I/O priority of + the process. + Work only with ionice_class. + Ignored if IOPRIO_CLASS_IDLE + is set. +quarantine_threshold 0 The reconstructor may quarantine + stale isolated fragments + when it fails to fetch + more than the + quarantine_threshold + number of fragments + (including the stale + fragment) during an + attempt to reconstruct. +quarantine_age reclaim_age Fragments are not quarantined + until they are older than + quarantine_age, which defaults + to the value of reclaim_age. +=========================== ======================== ================================ + +**************** +[object-updater] +**************** + +=================== =================== ========================================== +Option Default Description +------------------- ------------------- ------------------------------------------ +log_name object-updater Label used when logging +log_facility LOG_LOCAL0 Syslog log facility +log_level INFO Logging level +log_address /dev/log Logging directory +interval 300 Minimum time for a pass to take +updater_workers 1 Number of worker processes +concurrency 8 Number of updates to run concurrently in + each worker process +node_timeout DEFAULT or 10 Request timeout to external services. This + uses what's set here, or what's set in the + DEFAULT section, or 10 (though other + sections use 3 as the final default). +objects_per_second 50 Maximum objects updated per second. + Should be tuned according to individual + system specs. 0 is unlimited. +slowdown 0.01 Time in seconds to wait between objects. + Deprecated in favor of objects_per_second. +report_interval 300 Interval in seconds between logging + statistics about the current update pass. +recon_cache_path /var/cache/swift Path to recon cache +nice_priority None Scheduling priority of server processes. + Niceness values range from -20 (most + favorable to the process) to 19 (least + favorable to the process). The default + does not modify priority. +ionice_class None I/O scheduling class of server processes. + I/O niceness class values are IOPRIO_CLASS_RT + (realtime), IOPRIO_CLASS_BE (best-effort), + and IOPRIO_CLASS_IDLE (idle). + The default does not modify class and + priority. Linux supports io scheduling + priorities and classes since 2.6.13 with + the CFQ io scheduler. + Work only with ionice_priority. +ionice_priority None I/O scheduling priority of server + processes. I/O niceness priority is + a number which goes from 0 to 7. + The higher the value, the lower the I/O + priority of the process. Work only with + ionice_class. + Ignored if IOPRIO_CLASS_IDLE is set. +=================== =================== ========================================== + +**************** +[object-auditor] +**************** + +=========================== =================== ========================================== +Option Default Description +--------------------------- ------------------- ------------------------------------------ +log_name object-auditor Label used when logging +log_facility LOG_LOCAL0 Syslog log facility +log_level INFO Logging level +log_address /dev/log Logging directory +log_time 3600 Frequency of status logs in seconds. 
+interval 30 Time in seconds to wait between + auditor passes +disk_chunk_size 65536 Size of chunks read during auditing +files_per_second 20 Maximum files audited per second per + auditor process. Should be tuned according + to individual system specs. 0 is unlimited. +bytes_per_second 10000000 Maximum bytes audited per second per + auditor process. Should be tuned according + to individual system specs. 0 is unlimited. +concurrency 1 The number of parallel processes to use + for checksum auditing. +zero_byte_files_per_second 50 +object_size_stats +recon_cache_path /var/cache/swift Path to recon cache +rsync_tempfile_timeout auto Time elapsed in seconds before rsync + tempfiles will be unlinked. Config value + of "auto" try to use object-replicator's + rsync_timeout + 900 or fallback to 86400 + (1 day). +nice_priority None Scheduling priority of server processes. + Niceness values range from -20 (most + favorable to the process) to 19 (least + favorable to the process). The default + does not modify priority. +ionice_class None I/O scheduling class of server processes. + I/O niceness class values are IOPRIO_CLASS_RT + (realtime), IOPRIO_CLASS_BE (best-effort), + and IOPRIO_CLASS_IDLE (idle). + The default does not modify class and + priority. Linux supports io scheduling + priorities and classes since 2.6.13 with + the CFQ io scheduler. + Work only with ionice_priority. +ionice_priority None I/O scheduling priority of server + processes. I/O niceness priority is + a number which goes from 0 to 7. + The higher the value, the lower the I/O + priority of the process. Work only with + ionice_class. + Ignored if IOPRIO_CLASS_IDLE is set. +=========================== =================== ========================================== + +**************** +[object-expirer] +**************** + +============================= =============================== ========================================== +Option Default Description +----------------------------- ------------------------------- ------------------------------------------ +log_name object-expirer Label used when logging +log_facility LOG_LOCAL0 Syslog log facility +log_level INFO Logging level +log_address /dev/log Logging directory +interval 300 Time in seconds to wait between + expirer passes +report_interval 300 Frequency of status logs in seconds. +concurrency 1 Level of concurrency to use to do the work, + this value must be set to at least 1 +dequeue_from_legacy False This service will look for jobs on the + legacy expirer task queue. +round_robin_task_cache_size 100000 Number of tasks objects to cache before processing. +processes 0 How many parts to divide the legacy work into, + one part per process that will be doing the work. + When set 0 means that a single legacy + process will be doing all the work. + This can only be used in conjunction with + ``dequeue_from_legacy``. +process 0 Which of the parts a particular legacy process will + work on. It is "zero based", if you want to use 3 + processes, you should run processes with process + set to 0, 1, and 2. + This can only be used in conjunction with + ``dequeue_from_legacy``. +reclaim_age 604800 How long an un-processable expired object + marker will be retried before it is abandoned. + It is not coupled with the tombstone reclaim age + in the consistency engine. 
+request_tries 3 The number of times the expirer's internal client + will attempt any given request in the event + of failure +recon_cache_path /var/cache/swift Path to recon cache +nice_priority None Scheduling priority of server processes. + Niceness values range from -20 (most + favorable to the process) to 19 (least + favorable to the process). The default + does not modify priority. +ionice_class None I/O scheduling class of server processes. + I/O niceness class values are IOPRIO_CLASS_RT + (realtime), IOPRIO_CLASS_BE (best-effort), + and IOPRIO_CLASS_IDLE (idle). + The default does not modify class and + priority. Linux supports io scheduling + priorities and classes since 2.6.13 with + the CFQ io scheduler. + Work only with ionice_priority. +ionice_priority None I/O scheduling priority of server + processes. I/O niceness priority is + a number which goes from 0 to 7. + The higher the value, the lower the I/O + priority of the process. Work only with + ionice_class. + Ignored if IOPRIO_CLASS_IDLE is set. +delay_reaping_ 0.0 A dynamic configuration option for + setting account level delay_reaping values. + The delay_reaping value is configured for + the account with the name placed in + . The object expirer will reap objects in + this account from disk only after this delay + following their x-delete-at time. +delay_reaping_/ 0.0 A dynamic configuration option for + setting container level delay_reaping values. + The delay_reaping value is configured for + the container with the account name placed + in and the container name in . + The object expirer will reap objects in this + container from disk only after this delay + following their x-delete-at time. +============================= =============================== ========================================== diff --git a/doc/source/config/proxy_server_config.rst b/doc/source/config/proxy_server_config.rst new file mode 100644 index 0000000000..877cd32559 --- /dev/null +++ b/doc/source/config/proxy_server_config.rst @@ -0,0 +1,392 @@ +.. _proxy-server-config: + +-------------------------- +Proxy Server Configuration +-------------------------- + +This document describes the configuration options available for the proxy +server. Some proxy server options may be configured on a :ref:`per-policy +` basis. Additional documentation for +proxy-server middleware can be found at :doc:`../middleware` and +:doc:`../overview_auth`. + +Documentation for other swift configuration options can be found at +:doc:`index`. + +An example Proxy Server configuration can be found at +etc/proxy-server.conf-sample in the source code repository. + +The following configuration sections are available: + +* :ref:`[DEFAULT] ` +* `[proxy-server]`_ + + +.. _proxy_server_default_options: + +********* +[DEFAULT] +********* + +==================================== ======================== ======================================== +Option Default Description +------------------------------------ ------------------------ ---------------------------------------- +bind_ip 0.0.0.0 IP Address for server to + bind to +bind_port 80 Port for server to bind to +keep_idle 600 Value to set for socket TCP_KEEPIDLE +bind_timeout 30 Seconds to attempt bind before + giving up +backlog 4096 Maximum number of allowed pending + connections +swift_dir /etc/swift Swift configuration directory +workers auto Override the number of + pre-forked workers that will + accept connections. If set it + should be an integer, zero + means no fork. 
If unset, it + will try to default to the + number of effective cpu cores + and fallback to one. See + :ref:`general-service-tuning`. +max_clients 1024 Maximum number of clients one + worker can process + simultaneously (it will + actually accept(2) N + + 1). Setting this to one (1) + will only handle one request at + a time, without accepting + another request + concurrently. +user swift User to run as +cert_file Path to the ssl .crt. This + should be enabled for testing + purposes only. +key_file Path to the ssl .key. This + should be enabled for testing + purposes only. +cors_allow_origin List of origin hosts that are allowed + for CORS requests in addition to what + the container has set. +strict_cors_mode True If True (default) then CORS + requests are only allowed if their + Origin header matches an allowed + origin. Otherwise, any Origin is + allowed. +cors_expose_headers This is a list of headers that + are included in the header + Access-Control-Expose-Headers + in addition to what the container + has set. +client_timeout 60 +trans_id_suffix This optional suffix (default is empty) + that would be appended to the swift + transaction id allows one to easily + figure out from which cluster that + X-Trans-Id belongs to. This is very + useful when one is managing more than + one swift cluster. +log_name swift Label used when logging +log_facility LOG_LOCAL0 Syslog log facility +log_level INFO Logging level +log_headers False +log_address /dev/log Logging directory +log_max_line_length 0 Caps the length of log + lines to the value given; + no limit if set to 0, the + default. +log_custom_handlers None Comma separated list of functions + to call to setup custom log + handlers. +log_udp_host Override log_address +log_udp_port 514 UDP log port +log_statsd_host None Enables StatsD logging; IPv4/IPv6 + address or a hostname. If a + hostname resolves to an IPv4 and IPv6 + address, the IPv4 address will be + used. +log_statsd_port 8125 +log_statsd_default_sample_rate 1.0 +log_statsd_sample_rate_factor 1.0 +log_statsd_metric_prefix +eventlet_debug false If true, turn on debug logging + for eventlet + +expose_info true Enables exposing configuration + settings via HTTP GET /info. +admin_key Key to use for admin calls that + are HMAC signed. Default + is empty, which will + disable admin calls to + /info. +disallowed_sections swift.valid_api_versions Allows the ability to withhold + sections from showing up in the + public calls to /info. You can + withhold subsections by separating + the dict level with a ".". +nice_priority None Scheduling priority of server + processes. + Niceness values range from -20 (most + favorable to the process) to 19 (least + favorable to the process). The default + does not modify priority. +ionice_class None I/O scheduling class of server + processes. I/O niceness class values + are IOPRIO_CLASS_RT (realtime), + IOPRIO_CLASS_BE (best-effort) and + IOPRIO_CLASS_IDLE (idle). + The default does not + modify class and priority. Linux + supports io scheduling priorities + and classes since 2.6.13 with + the CFQ io scheduler. + Work only with ionice_priority. +ionice_priority None I/O scheduling priority of server + processes. I/O niceness priority is + a number which goes from 0 to 7. + The higher the value, the lower + the I/O priority of the process. + Work only with ionice_class. + Ignored if IOPRIO_CLASS_IDLE is set. 
+==================================== ======================== ======================================== + +************** +[proxy-server] +************** + +============================================== =============== ===================================== +Option Default Description +---------------------------------------------- --------------- ------------------------------------- +use Entry point for paste.deploy for + the proxy server. For most + cases, this should be + ``egg:swift#proxy``. +set log_name proxy-server Label used when logging +set log_facility LOG_LOCAL0 Syslog log facility +set log_level INFO Log level +set log_headers True If True, log headers in each + request +set log_handoffs True If True, the proxy will log + whenever it has to failover to a + handoff node +recheck_account_existence 60 Cache timeout in seconds to + send memcached for account + existence +recheck_container_existence 60 Cache timeout in seconds to + send memcached for container + existence +account_existence_skip_cache_pct 0.0 Periodically, bypass the cache + for account info requests and + goto disk to refresh the data + in the cache. This is a percentage + of requests should randomly skip. + Values around 0.0 - 0.1 (1 in every + 1000) are recommended. +container_existence_skip_cache_pct 0.0 Periodically, bypass the cache + for container info requests and + goto disk to refresh the data + in the cache. This is a percentage + of requests should randomly skip. + Values around 0.0 - 0.1 (1 in every + 1000) are recommended. +container_updating_shard_ranges_skip_cache_pct 0.0 Periodically, bypass the cache + for shard_range update requests and + goto disk to refresh the data + in the cache. This is a percentage + of requests should randomly skip. + Values around 0.0 - 0.1 (1 in every + 1000) are recommended. +container_listing_shard_ranges_skip_cache_pct 0.0 Periodically, bypass the cache + for shard_range listing info requests + and goto disk to refresh the data + in the cache. This is a percentage + of requests should randomly skip. + Values around 0.0 - 0.1 (1 in every + 1000) are recommended. +object_chunk_size 65536 Chunk size to read from + object servers +client_chunk_size 65536 Chunk size to read from + clients +memcache_servers 127.0.0.1:11211 Comma separated list of + memcached servers + ip:port or [ipv6addr]:port, + if this value is + empty, the memcache client will look + for a :ref:`[memcache.conf] ` +memcache_max_connections 2 Max number of connections to + each memcached server per + worker +node_timeout 10 Request timeout to external + services +recoverable_node_timeout node_timeout Request timeout to external + services for requests that, on + failure, can be recovered + from. For example, object GET. +client_timeout 60 Timeout to read one chunk + from a client +conn_timeout 0.5 Connection timeout to + external services +error_suppression_interval 60 Time in seconds that must + elapse since the last error + for a node to be considered + no longer error limited +error_suppression_limit 10 Error count to consider a + node error limited +allow_account_management false Whether account PUTs and DELETEs + are even callable +account_autocreate false If set to 'true' authorized + accounts that do not yet exist + within the Swift cluster will + be automatically created. +max_containers_per_account 0 If set to a positive value, + trying to create a container + when the account already has at + least this maximum containers + will result in a 403 Forbidden. 
+ Note: This is a soft limit, + meaning a user might exceed the + cap for + recheck_account_existence before + the 403s kick in. +max_containers_whitelist This is a comma separated list + of account names that ignore + the max_containers_per_account + cap. +rate_limit_after_segment 10 Rate limit the download of + large object segments after + this segment is downloaded. +rate_limit_segments_per_sec 1 Rate limit large object + downloads at this rate. +request_node_count 2 * replicas Set to the number of nodes to + contact for a normal request. + You can use '* replicas' at the + end to have it use the number + given times the number of + replicas for the ring being used + for the request. +swift_owner_headers up to the auth system in use, + but usually indicates + administrative responsibilities. +sorting_method shuffle Storage nodes can be chosen at + random (shuffle), by using timing + measurements (timing), or by using + an explicit match (affinity). + Using timing measurements may allow + for lower overall latency, while + using affinity allows for finer + control. In both the timing and + affinity cases, equally-sorting nodes + are still randomly chosen to spread + load. This option may be overridden + in a per-policy configuration + section. +timing_expiry 300 If the "timing" sorting_method is + used, the timings will only be valid + for the number of seconds configured + by timing_expiry. +concurrent_gets off Use replica count number of + threads concurrently during a + GET/HEAD and return with the + first successful response. In + the EC case, this parameter only + affects an EC HEAD as an EC GET + behaves differently. +concurrency_timeout conn_timeout This parameter controls how long + to wait before firing off the + next concurrent_get thread. A + value of 0 would we fully concurrent, + any other number will stagger the + firing of the threads. This number + should be between 0 and node_timeout. + The default is conn_timeout (0.5). +nice_priority None Scheduling priority of server + processes. + Niceness values range from -20 (most + favorable to the process) to 19 (least + favorable to the process). The default + does not modify priority. +ionice_class None I/O scheduling class of server + processes. I/O niceness class values + are IOPRIO_CLASS_RT (realtime), + IOPRIO_CLASS_BE (best-effort), + and IOPRIO_CLASS_IDLE (idle). + The default does not modify class and + priority. Linux supports io scheduling + priorities and classes since 2.6.13 + with the CFQ io scheduler. + Work only with ionice_priority. +ionice_priority None I/O scheduling priority of server + processes. I/O niceness priority is + a number which goes from 0 to 7. + The higher the value, the lower the + I/O priority of the process. Work + only with ionice_class. + Ignored if IOPRIO_CLASS_IDLE is set. +read_affinity None Specifies which backend servers to + prefer on reads; used in conjunction + with the sorting_method option being + set to 'affinity'. Format is a comma + separated list of affinity descriptors + of the form =. + The may be r for + selecting nodes in region N or + rz for selecting nodes in + region N, zone M. The + value should be a whole number + that represents the priority to + be given to the selection; lower + numbers are higher priority. + Default is empty, meaning no + preference. This option may be + overridden in a per-policy + configuration section. +write_affinity None Specifies which backend servers to + prefer on writes. 
Format is a comma + separated list of affinity + descriptors of the form r for + region N or rz for region N, + zone M. Default is empty, meaning no + preference. This option may be + overridden in a per-policy + configuration section. +write_affinity_node_count 2 * replicas The number of local (as governed by + the write_affinity setting) nodes to + attempt to contact first on writes, + before any non-local ones. The value + should be an integer number, or use + '* replicas' at the end to have it + use the number given times the number + of replicas for the ring being used + for the request. This option may be + overridden in a per-policy + configuration section. +write_affinity_handoff_delete_count auto The number of local (as governed by + the write_affinity setting) handoff + nodes to attempt to contact on + deletion, in addition to primary + nodes. Example: in geographically + distributed deployment, If replicas=3, + sometimes there may be 1 primary node + and 2 local handoff nodes in one region + holding the object after uploading but + before object replicated to the + appropriate locations in other regions. + In this case, include these handoff + nodes to send request when deleting + object could help make correct decision + for the response. The default value 'auto' + means Swift will calculate the number + automatically, the default value is + (replicas - len(local_primary_nodes)). + This option may be overridden in a + per-policy configuration section. +allow_open_expired false If true (default is false), an object that + has expired but not yet been reaped can be + can be accessed by setting the + 'x-open-expired' header to true in + GET, HEAD, and POST requests. +============================================== =============== ===================================== diff --git a/doc/source/config/swift_common_config.rst b/doc/source/config/swift_common_config.rst new file mode 100644 index 0000000000..8bb6eabe91 --- /dev/null +++ b/doc/source/config/swift_common_config.rst @@ -0,0 +1,35 @@ +.. _swift-common-config: + +-------------------- +Common configuration +-------------------- + +This document describes the configuration options common to all swift servers. +Documentation for other swift configuration options can be found at +:doc:`index`. + +An example of common configuration file can be found at etc/swift.conf-sample + +The following configuration options are available: + +========================== ========== ============================================= +Option Default Description +-------------------------- ---------- --------------------------------------------- +max_header_size 8192 max_header_size is the max number of bytes in + the utf8 encoding of each header. Using 8192 + as default because eventlet use 8192 as max + size of header line. This value may need to + be increased when using identity v3 API + tokens including more than 7 catalog entries. + See also include_service_catalog in + proxy-server.conf-sample (documented in + overview_auth.rst). +extra_header_count 0 By default the maximum number of allowed + headers depends on the number of max + allowed metadata settings plus a default + value of 32 for regular http headers. + If for some reason this is not enough (custom + middleware for example) it can be increased + with the extra_header_count constraint. 
+========================== ========== ============================================= + diff --git a/doc/source/container.rst b/doc/source/container.rst index d80adcaa32..bc95753852 100644 --- a/doc/source/container.rst +++ b/doc/source/container.rst @@ -4,6 +4,36 @@ Container ********* +.. _container-auditor: + +Container Auditor +================= + +.. automodule:: swift.container.auditor + :members: + :undoc-members: + :show-inheritance: + +.. _container-backend: + +Container Backend +================= + +.. automodule:: swift.container.backend + :members: + :undoc-members: + :show-inheritance: + +.. _container-replicator: + +Container Replicator +==================== + +.. automodule:: swift.container.replicator + :members: + :undoc-members: + :show-inheritance: + .. _container-server: Container Server @@ -14,26 +44,28 @@ Container Server :undoc-members: :show-inheritance: -.. _container-updater: +.. _container-reconciler: -Container Updater -================= +Container Reconciler +==================== -.. automodule:: swift.container.updater +.. automodule:: swift.container.reconciler :members: :undoc-members: :show-inheritance: -.. _container-auditor: +.. _container-sharder: -Container Auditor +Container Sharder ================= -.. automodule:: swift.container.auditor +.. automodule:: swift.container.sharder :members: :undoc-members: :show-inheritance: +.. _container-sync-daemon: + Container Sync ============== @@ -41,3 +73,13 @@ Container Sync :members: :undoc-members: :show-inheritance: + +.. _container-updater: + +Container Updater +================= + +.. automodule:: swift.container.updater + :members: + :undoc-members: + :show-inheritance: diff --git a/doc/source/contributor/contributing.rst b/doc/source/contributor/contributing.rst new file mode 100644 index 0000000000..52561addb0 --- /dev/null +++ b/doc/source/contributor/contributing.rst @@ -0,0 +1,75 @@ +.. include:: ../../../CONTRIBUTING.rst + +Community +========= + +Communication +------------- +IRC + People working on the Swift project may be found in the + ``#openstack-swift`` channel on OFTC during working hours + in their timezone. The channel is logged, so if you ask + a question when no one is around, you can + `check the log `__ + to see if it's been answered. + +weekly meeting + This is a Swift team meeting. The discussion in this meeting is about + all things related to the Swift project: + +- time: http://eavesdrop.openstack.org/#Swift_Team_Meeting +- agenda: https://wiki.openstack.org/wiki/Meetings/Swift + +mailing list + We use the openstack-discuss@lists.openstack.org mailing list for + asynchronous discussions or to communicate with other OpenStack teams. + Use the prefix ``[swift]`` in your subject line (it's a high-volume + list, so most people use email filters). + + You can use our `mailing list info page `__ to read the archives and subscribe. + +Contacting the Core Team +------------------------ + +The swift-core team is an active group of contributors who are responsible +for directing and maintaining the Swift project. As a new contributor, your +interaction with this group will be mostly through code reviews, because +only members of swift-core can approve a code change to be merged into the +code repository. But the swift-core team also spend time on IRC so feel +free to drop in to ask questions or just to meet us. + +.. note:: + Although your contribution will require reviews by members of + swift-core, these aren't the only people whose reviews matter. 
+ Anyone with a gerrit account can post reviews, so you can ask + other developers you know to review your code ... and you can + review theirs. (A good way to learn your way around the codebase + is to review other people's patches.) + + If you're thinking, "I'm new at this, how can I possibly provide + a helpful review?", take a look at `How to Review Changes the + OpenStack Way + `_. + + Or, for guidance more specific to Swift, read :doc:`review_guidelines`. + +You can read about the role of core reviewers in the +`OpenStack governance documentation +`_, learn +more about the swift-core members in our gerrit +`membership list `__, and +also find the team at our `Swift weekly meetings <#communication>`__. + +Getting Your Patch Merged +------------------------- +Understanding how reviewers review and what they look for will help get +your code merged. See `Swift Review Guidelines `_ +for how we review code. + +Keep in mind that reviewers are also human; if something feels stalled, then +come and poke us on IRC or add it to our meeting agenda. + +Project Team Lead Duties +------------------------ +All common PTL duties are enumerated in the `PTL guide +`_. diff --git a/doc/source/contributor/review_guidelines.rst b/doc/source/contributor/review_guidelines.rst new file mode 100644 index 0000000000..314e764f49 --- /dev/null +++ b/doc/source/contributor/review_guidelines.rst @@ -0,0 +1 @@ +.. include:: ../../../REVIEW_GUIDELINES.rst diff --git a/doc/source/cors.rst b/doc/source/cors.rst new file mode 100644 index 0000000000..91e1611b5d --- /dev/null +++ b/doc/source/cors.rst @@ -0,0 +1,106 @@ +==== +CORS +==== + +CORS_ is a mechanism to allow code running in a browser (Javascript for +example) to make requests to a domain other than the one it originated from. + +Swift supports CORS requests to containers and objects. + +CORS metadata is held on the container only. The values given apply to the +container itself and all objects within it. + +The supported headers are: + ++------------------------------------------------+------------------------------+ +| Metadata | Use | ++================================================+==============================+ +| X-Container-Meta-Access-Control-Allow-Origin | Origins to be allowed to | +| | make Cross Origin Requests, | +| | space separated. | ++------------------------------------------------+------------------------------+ +| X-Container-Meta-Access-Control-Max-Age | Max age for the Origin to | +| | hold the preflight results. | ++------------------------------------------------+------------------------------+ +| X-Container-Meta-Access-Control-Expose-Headers | Headers exposed to the user | +| | agent (e.g. browser) in the | +| | actual request response. | +| | Space separated. | ++------------------------------------------------+------------------------------+ + +In addition to the values set in container metadata, some cluster-wide values +may also be configured using the ``strict_cors_mode``, ``cors_allow_origin`` +and ``cors_expose_headers`` options in ``proxy-server.conf``. See +``proxy-server.conf-sample`` for more information. + +Before a browser issues an actual request it may issue a `preflight request`_. +The preflight request is an OPTIONS call to verify the Origin is allowed to +make the request. The sequence of events is: + +* Browser makes OPTIONS request to Swift +* Swift returns 200/401 to browser based on allowed origins +* If 200, browser makes the "actual request" to Swift, i.e. 
PUT, POST, DELETE, + HEAD, GET + +When a browser receives a response to an actual request it only exposes those +headers listed in the ``Access-Control-Expose-Headers`` header. By default Swift +returns the following values for this header: + +* "simple response headers" as listed on + http://www.w3.org/TR/cors/#simple-response-header +* the headers ``etag``, ``x-timestamp``, ``x-trans-id``, + ``x-openstack-request-id`` +* all metadata headers (``X-Container-Meta-*`` for containers and + ``X-Object-Meta-*`` for objects) +* headers listed in ``X-Container-Meta-Access-Control-Expose-Headers`` +* headers configured using the ``cors_expose_headers`` option in + ``proxy-server.conf`` + +.. note:: + An OPTIONS request to a symlink object will respond with the options for + the symlink only; the request will not be redirected to the target object. + Therefore, if the symlink's target object is in another container with + CORS settings, the response will not reflect the settings. + + +----------------- +Sample Javascript +----------------- + +To see some CORS Javascript in action, download the `test CORS page`_ (source +below). Host it on a webserver and take note of the protocol and hostname +(origin) you'll be using to request the page, e.g. http://localhost. + +Locate a container you'd like to query. Needless to say, the Swift cluster +hosting this container should have CORS support. Append the origin of the +test page to the container's ``X-Container-Meta-Access-Control-Allow-Origin`` +header:: + + curl -X POST -H 'X-Auth-Token: xxx' \ + -H 'X-Container-Meta-Access-Control-Allow-Origin: http://localhost' \ + http://192.168.56.3:8080/v1/AUTH_test/cont1 + +At this point the container is now accessible to CORS clients hosted on +http://localhost. Open the test CORS page in your browser. + +#. Populate the Token field +#. Populate the URL field with the URL of either a container or object +#. Select the request method +#. Hit Submit + +Assuming the request succeeds you should see the response header and body. If +something went wrong the response status will be 0. + +.. _test CORS page: + +-------------- +Test CORS Page +-------------- + +A sample cross-site test page is located in the project source tree +``doc/source/test-cors.html``. + +.. literalinclude:: test-cors.html + +.. _CORS: https://developer.mozilla.org/en-US/docs/HTTP/Access_control_CORS +.. _preflight request: https://developer.mozilla.org/en-US/docs/HTTP/Access_control_CORS#Preflighted_requests diff --git a/doc/source/crossdomain.rst b/doc/source/crossdomain.rst new file mode 100644 index 0000000000..31915d3689 --- /dev/null +++ b/doc/source/crossdomain.rst @@ -0,0 +1,69 @@ +======================== +Cross-domain Policy File +======================== + +A cross-domain policy file allows web pages hosted elsewhere to use client +side technologies such as Flash, Java and Silverlight to interact +with the Swift API. + +See https://www.adobe.com/devnet-docs/acrobatetk/tools/AppSec/xdomain.html for +a description of the purpose and structure of the cross-domain policy +file. The cross-domain policy file is installed in the root of a web +server (i.e., the path is ``/crossdomain.xml``). + +The crossdomain middleware responds to a path of ``/crossdomain.xml`` with an +XML document such as: + +.. code:: xml + + <?xml version="1.0"?> + <!DOCTYPE cross-domain-policy SYSTEM "http://www.adobe.com/xml/dtds/cross-domain-policy.dtd" > + <cross-domain-policy> + <allow-access-from domain="*" secure="false" /> + </cross-domain-policy> + +You should use a policy appropriate to your site. The examples and the +default policy are provided to indicate how to syntactically construct +a cross domain policy file -- they are not recommendations. 
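Once the crossdomain middleware is enabled (see the Configuration section below), serving of the policy file can be sanity-checked with any HTTP client. No auth token should be needed, assuming the middleware is placed before the authentication middleware as recommended below; the proxy address used here is only an example::

    curl -i http://127.0.0.1:8080/crossdomain.xml

A 200 response containing the configured policy document indicates the middleware is answering at the expected path.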
+ +------------- +Configuration +------------- + +To enable this middleware, add it to the pipeline in your proxy-server.conf +file. It should be added before any authentication (e.g., tempauth or +keystone) middleware. In this example ellipsis (...) indicate other +middleware you may have chosen to use: + +.. code:: cfg + + [pipeline:main] + pipeline = ... crossdomain ... authtoken ... proxy-server + +And add a filter section, such as: + +.. code:: cfg + + [filter:crossdomain] + use = egg:swift#crossdomain + cross_domain_policy = + + +For continuation lines, put some whitespace before the continuation +text. Ensure you put a completely blank line to terminate the +``cross_domain_policy`` value. + +The ``cross_domain_policy`` name/value is optional. If omitted, the policy +defaults as if you had specified: + +.. code:: cfg + + cross_domain_policy = + +.. note:: + + The default policy is very permissive; this is appropriate + for most public cloud deployments, but may not be appropriate + for all deployments. See also: + `CWE-942 `__ + diff --git a/doc/source/deployment_guide.rst b/doc/source/deployment_guide.rst index badcd22ba2..2a8d52bed4 100644 --- a/doc/source/deployment_guide.rst +++ b/doc/source/deployment_guide.rst @@ -1,24 +1,25 @@ -================ + Deployment Guide ================ +This document provides general guidance for deploying and configuring Swift. +Detailed descriptions of configuration options can be found in the +:doc:`configuration documentation `. + ----------------------- Hardware Considerations ----------------------- -Swift is designed to run on commodity hardware. At Rackspace, our storage -servers are currently running fairly generic 4U servers with 24 2T SATA -drives and 8 cores of processing power. RAID on the storage drives is not -required and not recommended. Swift's disk usage pattern is the worst -case possible for RAID, and performance degrades very quickly using RAID 5 -or 6. +Swift is designed to run on commodity hardware. RAID on the storage drives is +not required and not recommended. Swift's disk usage pattern is the worst case +possible for RAID, and performance degrades very quickly using RAID 5 or 6. ------------------ Deployment Options ------------------ -The swift services run completely autonomously, which provides for a lot of -flexibility when architecting the hardware deployment for swift. The 4 main +The Swift services run completely autonomously, which provides for a lot of +flexibility when architecting the hardware deployment for Swift. The 4 main services are: #. Proxy Services @@ -36,21 +37,35 @@ and network I/O intensive. The easiest deployment is to install all services on each server. There is nothing wrong with doing this, as it scales each service out horizontally. -At Rackspace, we put the Proxy Services on their own servers and all of the -Storage Services on the same server. This allows us to send 10g networking to -the proxy and 1g to the storage servers, and keep load balancing to the -proxies more manageable. Storage Services scale out horizontally as storage -servers are added, and we can scale overall API throughput by adding more -Proxies. +Alternatively, one set of servers may be dedicated to the Proxy Services and a +different set of servers dedicated to the Storage Services. This allows faster +networking to be configured to the proxy than the storage servers, and keeps +load balancing to the proxies more manageable. 
Storage Services scale out +horizontally as storage servers are added, and the overall API throughput can +be scaled by adding more proxies. If you need more throughput to either Account or Container Services, they may each be deployed to their own servers. For example you might use faster (but more expensive) SAS or even SSD drives to get faster disk I/O to the databases. +A high-availability (HA) deployment of Swift requires that multiple proxy +servers are deployed and requests are load-balanced between them. Each proxy +server instance is stateless and able to respond to requests for the entire +cluster. + Load balancing and network design is left as an exercise to the reader, but this is a very important part of the cluster, so time should be spent designing the network for a Swift cluster. + +--------------------- +Web Front End Options +--------------------- + +Swift comes with an integral web front end. However, it can also be deployed +as a request processor for Apache2 using mod_wsgi, as described in +:doc:`Apache Deployment Guide <apache_deployment_guide>`. + .. _ring-preparing: ------------------ @@ -87,8 +102,12 @@ into consideration can include physical location, power availability, and network connectivity. For example, in a small cluster you might decide to split the zones up by cabinet, with each cabinet having its own power and network connectivity. The zone concept is very abstract, so feel free to use -it in whatever way best isolates your data from failure. Zones are referenced -by number, beginning with 1. +it in whatever way best isolates your data from failure. Each zone exists +in a region. + +A region is also an abstract concept that may be used to distinguish between +geographically separated areas, as well as different areas within the same +datacenter. Regions and zones are referenced by a positive integer. You can now start building the ring with:: @@ -100,17 +119,18 @@ specific partition can be moved in succession (24 is a good value for this). Devices can be added to the ring with:: - swift-ring-builder <builder_file> add z<zone>-<ip>:<port>/<device_name>_<meta> <weight> + swift-ring-builder <builder_file> add r<region>z<zone>-<ip>:<port>/<device_name>_<meta> <weight> This will add a device to the ring where <builder_file> is the name of the -builder file that was created previously, <zone> is the number of the zone -this device is in, <ip> is the ip address of the server the device is in, -<port> is the port number that the server is running on, <device_name> is -the name of the device on the server (for example: sdb1), <meta> is a string -of metadata for the device (optional), and <weight> is a float weight that -determines how many partitions are put on the device relative to the rest of -the devices in the cluster (a good starting point is 100.0 x TB on the drive). -Add each device that will be initially in the cluster. +builder file that was created previously, <region> is the number of the region +the zone is in, <zone> is the number of the zone this device is in, <ip> is +the ip address of the server the device is in, <port> is the port number that +the server is running on, <device_name> is the name of the device on the server +(for example: sdb1), <meta> is a string of metadata for the device (optional), +and <weight> is a float weight that determines how many partitions are put on +the device relative to the rest of the devices in the cluster (a good starting +point is 100.0 x TB on the drive). Add each device that will be initially in the +cluster. Once all of the devices are added to the ring, run:: @@ -130,15 +150,164 @@ swift-ring-builder with no options will display help text with available commands and options. More information on how the ring works internally can be found in the :doc:`Ring Overview <overview_ring>`. .. 
_server-per-port-configuration: + +------------------------------- +Running object-servers Per Disk +------------------------------- + +The lack of true asynchronous file I/O on Linux leaves the object-server +workers vulnerable to misbehaving disks. Because any object-server worker can +service a request for any disk, and a slow I/O request blocks the eventlet hub, +a single slow disk can impair an entire storage node. This also prevents +object servers from fully utilizing all their disks during heavy load. + +Another way to get full I/O isolation is to give each disk on a storage node a +different port in the storage policy rings. Then set the +:ref:`servers_per_port ` +option in the object-server config. NOTE: while the purpose of this config +setting is to run one or more object-server worker processes per *disk*, the +implementation just runs object-servers per unique port of local devices in the +rings. The deployer must combine this option with appropriately-configured +rings to benefit from this feature. + +Here's an example (abbreviated) old-style ring (2 node cluster with 2 disks +each):: + + Devices: id region zone ip address port replication ip replication port name + 0 1 1 1.1.0.1 6200 1.1.0.1 6200 d1 + 1 1 1 1.1.0.1 6200 1.1.0.1 6200 d2 + 2 1 2 1.1.0.2 6200 1.1.0.2 6200 d3 + 3 1 2 1.1.0.2 6200 1.1.0.2 6200 d4 + +And here's the same ring set up for ``servers_per_port``:: + + Devices: id region zone ip address port replication ip replication port name + 0 1 1 1.1.0.1 6200 1.1.0.1 6200 d1 + 1 1 1 1.1.0.1 6201 1.1.0.1 6201 d2 + 2 1 2 1.1.0.2 6200 1.1.0.2 6200 d3 + 3 1 2 1.1.0.2 6201 1.1.0.2 6201 d4 + +When migrating from normal to ``servers_per_port``, perform these steps in order: + +#. Upgrade Swift code to a version capable of doing ``servers_per_port``. + +#. Enable ``servers_per_port`` with a value greater than zero. + +#. Restart ``swift-object-server`` processes with a SIGHUP. At this point, you + will have the ``servers_per_port`` number of ``swift-object-server`` processes + serving all requests for all disks on each node. This preserves + availability, but you should perform the next step as quickly as possible. + +#. Push out new rings that actually have different ports per disk on each + server. One of the ports in the new ring should be the same as the port + used in the old ring ("6200" in the example above). This will cover + existing proxy-server processes who haven't loaded the new ring yet. They + can still talk to any storage node regardless of whether or not that + storage node has loaded the ring and started object-server processes on the + new ports. + +If you do not run a separate object-server for replication, then this setting +must be available to the object-replicator and object-reconstructor (i.e. +appear in the [DEFAULT] config section). + +.. _general-service-configuration: + +----------------------------- +General Service Configuration +----------------------------- + +Most Swift services fall into two categories. Swift's wsgi servers and +background daemons. + +For more information specific to the configuration of Swift's wsgi servers +with paste deploy see :ref:`general-server-configuration`. + +Configuration for servers and daemons can be expressed together in the same +file for each type of server, or separately. If a required section for the +service trying to start is missing there will be an error. The sections not +used by the service are ignored. + +Consider the example of an object storage node. 
By convention, configuration +for the object-server, object-updater, object-replicator, object-auditor, and +object-reconstructor exist in a single file ``/etc/swift/object-server.conf``:: + + [DEFAULT] + reclaim_age = 604800 + + [pipeline:main] + pipeline = object-server + + [app:object-server] + use = egg:swift#object + + [object-replicator] + + [object-updater] + + [object-auditor] + +Swift services expect a configuration path as the first argument:: + + $ swift-object-auditor + Usage: swift-object-auditor CONFIG [options] + + Error: missing config path argument + +If you omit the object-auditor section this file could not be used as the +configuration path when starting the ``swift-object-auditor`` daemon:: + + $ swift-object-auditor /etc/swift/object-server.conf + Unable to find object-auditor config section in /etc/swift/object-server.conf + +If the configuration path is a directory instead of a file all of the files in +the directory with the file extension ".conf" will be combined to generate the +configuration object which is delivered to the Swift service. This is +referred to generally as "directory based configuration". + +Directory based configuration leverages ConfigParser's native multi-file +support. Files ending in ".conf" in the given directory are parsed in +lexicographical order. Filenames starting with '.' are ignored. A mixture of +file and directory configuration paths is not supported - if the configuration +path is a file only that file will be parsed. + +The Swift service management tool ``swift-init`` has adopted the convention of +looking for ``/etc/swift/{type}-server.conf.d/`` if the file +``/etc/swift/{type}-server.conf`` file does not exist. + +When using directory based configuration, if the same option under the same +section appears more than once in different files, the last value parsed is +said to override previous occurrences. You can ensure proper override +precedence by prefixing the files in the configuration directory with +numerical values.:: + + /etc/swift/ + default.base + object-server.conf.d/ + 000_default.conf -> ../default.base + 001_default-override.conf + 010_server.conf + 020_replicator.conf + 030_updater.conf + 040_auditor.conf + +You can inspect the resulting combined configuration object using the +``swift-config`` command line tool + +.. _general-server-configuration: + ---------------------------- General Server Configuration ---------------------------- -Swift uses paste.deploy (http://pythonpaste.org/deploy/) to manage server -configurations. Default configuration options are set in the `[DEFAULT]` -section, and any options specified there can be overridden in any of the other -sections BUT ONLY BY USING THE SYNTAX ``set option_name = value``. This is the -unfortunate way paste.deploy works and I'll try to explain it in full. +Swift uses paste.deploy (https://pypi.org/project/Paste/) to manage server +configurations. Detailed descriptions of configuration options can be found in +the :doc:`configuration documentation `. + +Default configuration options are set in the ``[DEFAULT]`` section, and any +options specified there can be overridden in any of the other sections BUT +ONLY BY USING THE SYNTAX ``set option_name = value``. This is the unfortunate +way paste.deploy works and I'll try to explain it in full. 
First, here's an example paste.deploy configuration file:: @@ -169,30 +338,30 @@ The resulting configuration that myapp receives is:: 'set name4': 'globalvalue'} local {'name6': 'localvalue'} -So, `name1` got the global value which is fine since it's only in the `DEFAULT` +So, ``name1`` got the global value which is fine since it's only in the ``DEFAULT`` section anyway. -`name2` got the global value from `DEFAULT` even though it appears to be -overridden in the `app:myapp` subsection. This is just the unfortunate way +``name2`` got the global value from ``DEFAULT`` even though it appears to be +overridden in the ``app:myapp`` subsection. This is just the unfortunate way paste.deploy works (at least at the time of this writing.) -`name3` got the local value from the `app:myapp` subsection because it is using +``name3`` got the local value from the ``app:myapp`` subsection because it is using the special paste.deploy syntax of ``set option_name = value``. So, if you want -a default value for most app/filters but want to overridde it in one +a default value for most app/filters but want to override it in one subsection, this is how you do it. -`name4` got the global value from `DEFAULT` since it's only in that section -anyway. But, since we used the ``set`` syntax in the `DEFAULT` section even +``name4`` got the global value from ``DEFAULT`` since it's only in that section +anyway. But, since we used the ``set`` syntax in the ``DEFAULT`` section even though we shouldn't, notice we also got a ``set name4`` variable. Weird, but probably not harmful. -`name5` got the local value from the `app:myapp` subsection since it's only +``name5`` got the local value from the ``app:myapp`` subsection since it's only there anyway, but notice that it is in the global configuration and not the local configuration. This is because we used the ``set`` syntax to set the value. Again, weird, but not harmful since Swift just treats the two sets of configuration values as one set anyway. -`name6` got the local value from `app:myapp` subsection since it's only there, +``name6`` got the local value from ``app:myapp`` subsection since it's only there, and since we didn't use the ``set`` syntax, it's only in the local configuration and not the global one. Though, as indicated above, there is no special distinction with Swift. @@ -209,522 +378,148 @@ The main rule to remember when working with Swift configuration files is: configuration files. ---------------------------- -Object Server Configuration ---------------------------- - -An Example Object Server configuration can be found at -etc/object-server.conf-sample in the source code repository. - -The following configuration options are available: - -[DEFAULT] - -=================== ========== ============================================= -Option Default Description -------------------- ---------- --------------------------------------------- -swift_dir /etc/swift Swift configuration directory -devices /srv/node Parent directory of where devices are mounted -mount_check true Whether or not check if the devices are - mounted to prevent accidentally writing - to the root device -bind_ip 0.0.0.0 IP Address for server to bind to -bind_port 6000 Port for server to bind to -bind_timeout 30 Seconds to attempt bind before giving up -workers 1 Number of workers to fork -disable_fallocate false Disable "fast fail" fallocate checks if the - underlying filesystem does not support it. 
-log_custom_handlers None Comma-separated list of functions to call - to setup custom log handlers. -eventlet_debug false If true, turn on debug logging for eventlet -=================== ========== ============================================= - -[object-server] - -================== ============= =========================================== -Option Default Description ------------------- ------------- ------------------------------------------- -use paste.deploy entry point for the object - server. For most cases, this should be - `egg:swift#object`. -set log_name object-server Label used when logging -set log_facility LOG_LOCAL0 Syslog log facility -set log_level INFO Logging level -set log_requests True Whether or not to log each request -user swift User to run as -node_timeout 3 Request timeout to external services -conn_timeout 0.5 Connection timeout to external services -network_chunk_size 65536 Size of chunks to read/write over the - network -disk_chunk_size 65536 Size of chunks to read/write to disk -max_upload_time 86400 Maximum time allowed to upload an object -slow 0 If > 0, Minimum time in seconds for a PUT - or DELETE request to complete -mb_per_sync 512 On PUT requests, sync file every n MB -keep_cache_size 5242880 Largest object size to keep in buffer cache -keep_cache_private false Allow non-public objects to stay in - kernel's buffer cache -================== ============= =========================================== - -[object-replicator] - -================== ================= ======================================= -Option Default Description ------------------- ----------------- --------------------------------------- -log_name object-replicator Label used when logging -log_facility LOG_LOCAL0 Syslog log facility -log_level INFO Logging level -daemonize yes Whether or not to run replication as a - daemon -run_pause 30 Time in seconds to wait between - replication passes -concurrency 1 Number of replication workers to spawn -timeout 5 Timeout value sent to rsync --timeout - and --contimeout options -stats_interval 3600 Interval in seconds between logging - replication statistics -reclaim_age 604800 Time elapsed in seconds before an - object can be reclaimed -================== ================= ======================================= - -[object-updater] - -================== ============== ========================================== -Option Default Description ------------------- -------------- ------------------------------------------ -log_name object-updater Label used when logging -log_facility LOG_LOCAL0 Syslog log facility -log_level INFO Logging level -interval 300 Minimum time for a pass to take -concurrency 1 Number of updater workers to spawn -node_timeout 10 Request timeout to external services -conn_timeout 0.5 Connection timeout to external services -slowdown 0.01 Time in seconds to wait between objects -================== ============== ========================================== - -[object-auditor] - -================== ============== ========================================== -Option Default Description ------------------- -------------- ------------------------------------------ -log_name object-auditor Label used when logging -log_facility LOG_LOCAL0 Syslog log facility -log_level INFO Logging level -log_time 3600 Frequency of status logs in seconds. -files_per_second 20 Maximum files audited per second. Should - be tuned according to individual system - specs. 0 is unlimited. -bytes_per_second 10000000 Maximum bytes audited per second. 
Should - be tuned according to individual system - specs. 0 is unlimited. -================== ============== ========================================== - ------------------------------- -Container Server Configuration ------------------------------- - -An example Container Server configuration can be found at -etc/container-server.conf-sample in the source code repository. - -The following configuration options are available: - -[DEFAULT] - -=================== ========== ============================================ -Option Default Description -------------------- ---------- -------------------------------------------- -swift_dir /etc/swift Swift configuration directory -devices /srv/node Parent directory of where devices are mounted -mount_check true Whether or not check if the devices are - mounted to prevent accidentally writing - to the root device -bind_ip 0.0.0.0 IP Address for server to bind to -bind_port 6001 Port for server to bind to -bind_timeout 30 Seconds to attempt bind before giving up -workers 1 Number of workers to fork -user swift User to run as -disable_fallocate false Disable "fast fail" fallocate checks if the - underlying filesystem does not support it. -log_custom_handlers None Comma-separated list of functions to call - to setup custom log handlers. -eventlet_debug false If true, turn on debug logging for eventlet -=================== ========== ============================================ - -[container-server] - -================== ================ ======================================== -Option Default Description ------------------- ---------------- ---------------------------------------- -use paste.deploy entry point for the - container server. For most cases, this - should be `egg:swift#container`. -set log_name container-server Label used when logging -set log_facility LOG_LOCAL0 Syslog log facility -set log_level INFO Logging level -node_timeout 3 Request timeout to external services -conn_timeout 0.5 Connection timeout to external services -allow_versions false Enable/Disable object versioning feature -================== ================ ======================================== - -[container-replicator] - -================== ==================== ==================================== -Option Default Description ------------------- -------------------- ------------------------------------ -log_name container-replicator Label used when logging -log_facility LOG_LOCAL0 Syslog log facility -log_level INFO Logging level -per_diff 1000 -concurrency 8 Number of replication workers to - spawn -run_pause 30 Time in seconds to wait between - replication passes -node_timeout 10 Request timeout to external services -conn_timeout 0.5 Connection timeout to external - services -reclaim_age 604800 Time elapsed in seconds before a - container can be reclaimed -================== ==================== ==================================== - -[container-updater] - -======================== ================= ================================== -Option Default Description ------------------------- ----------------- ---------------------------------- -log_name container-updater Label used when logging -log_facility LOG_LOCAL0 Syslog log facility -log_level INFO Logging level -interval 300 Minimum time for a pass to take -concurrency 4 Number of updater workers to spawn -node_timeout 3 Request timeout to external - services -conn_timeout 0.5 Connection timeout to external - services -slowdown 0.01 Time in seconds to wait between - containers -account_suppression_time 60 Seconds to 
suppress updating an - account that has generated an - error (timeout, not yet found, - etc.) -======================== ================= ================================== - -[container-auditor] - -================== ================= ======================================= -Option Default Description ------------------- ----------------- --------------------------------------- -log_name container-auditor Label used when logging -log_facility LOG_LOCAL0 Syslog log facility -log_level INFO Logging level -interval 1800 Minimum time for a pass to take -================== ================= ======================================= +.. _proxy_server_per_policy_config: ----------------------------- -Account Server Configuration ----------------------------- +************************ +Per policy configuration +************************ + +Some proxy-server configuration options may be overridden for individual +:doc:`overview_policies` by including per-policy config section(s). These +options are: + +- ``sorting_method`` +- ``read_affinity`` +- ``write_affinity`` +- ``write_affinity_node_count`` +- ``write_affinity_handoff_delete_count`` + +The per-policy config section name must be of the form:: + + [proxy-server:policy:] + +.. note:: + + The per-policy config section name should refer to the policy index, not + the policy name. + +.. note:: + + The first part of proxy-server config section name must match the name of + the proxy-server config section. This is typically ``proxy-server`` as + shown above, but if different then the names of any per-policy config + sections must be changed accordingly. + +The value of an option specified in a per-policy section will override any +value given in the proxy-server section for that policy only. Otherwise the +value of these options will be that specified in the proxy-server section. + +For example, the following section provides policy-specific options for a +policy with index ``3``:: + + [proxy-server:policy:3] + sorting_method = affinity + read_affinity = r2=1 + write_affinity = r2 + write_affinity_node_count = 1 * replicas + write_affinity_handoff_delete_count = 2 + +.. note:: + + It is recommended that per-policy config options are *not* included in the + ``[DEFAULT]`` section. If they are then the following behavior applies. + + Per-policy config sections will inherit options in the ``[DEFAULT]`` + section of the config file, and any such inheritance will take precedence + over inheriting options from the proxy-server config section. + + Per-policy config section options will override options in the + ``[DEFAULT]`` section. Unlike the behavior described under `General Server + Configuration`_ for paste-deploy ``filter`` and ``app`` sections, the + ``set`` keyword is not required for options to override in per-policy + config sections. 
+ + For example, given the following settings in a config file:: + + [DEFAULT] + sorting_method = affinity + read_affinity = r0=100 + write_affinity = r0 + + [app:proxy-server] + use = egg:swift#proxy + # use of set keyword here overrides [DEFAULT] option + set read_affinity = r1=100 + # without set keyword, [DEFAULT] option overrides in a paste-deploy section + write_affinity = r1 + + [proxy-server:policy:0] + sorting_method = affinity + # set keyword not required here to override [DEFAULT] option + write_affinity = r1 + + would result in policy with index ``0`` having settings: + + * ``read_affinity = r0=100`` (inherited from the ``[DEFAULT]`` section) + * ``write_affinity = r1`` (specified in the policy 0 section) + + and any other policy would have the default settings of: + + * ``read_affinity = r1=100`` (set in the proxy-server section) + * ``write_affinity = r0`` (inherited from the ``[DEFAULT]`` section) + +***************** +Proxy Middlewares +***************** + +Many features in Swift are implemented as middleware in the proxy-server +pipeline. See :doc:`middleware` and the ``proxy-server.conf-sample`` file for +more information. In particular, the use of some type of :doc:`authentication +and authorization middleware ` is highly recommended. -An example Account Server configuration can be found at -etc/account-server.conf-sample in the source code repository. - -The following configuration options are available: - -[DEFAULT] - -=================== ========== ============================================= -Option Default Description -------------------- ---------- --------------------------------------------- -swift_dir /etc/swift Swift configuration directory -devices /srv/node Parent directory or where devices are mounted -mount_check true Whether or not check if the devices are - mounted to prevent accidentally writing - to the root device -bind_ip 0.0.0.0 IP Address for server to bind to -bind_port 6002 Port for server to bind to -bind_timeout 30 Seconds to attempt bind before giving up -workers 1 Number of workers to fork -user swift User to run as -db_preallocation off If you don't mind the extra disk space usage in - overhead, you can turn this on to preallocate - disk space with SQLite databases to decrease - fragmentation. -disable_fallocate false Disable "fast fail" fallocate checks if the - underlying filesystem does not support it. -log_custom_handlers None Comma-separated list of functions to call - to setup custom log handlers. -eventlet_debug false If true, turn on debug logging for eventlet -=================== ========== ============================================= - -[account-server] - -================== ============== ========================================== -Option Default Description ------------------- -------------- ------------------------------------------ -use Entry point for paste.deploy for the account - server. For most cases, this should be - `egg:swift#account`. 
-set log_name account-server Label used when logging -set log_facility LOG_LOCAL0 Syslog log facility -set log_level INFO Logging level -================== ============== ========================================== - -[account-replicator] - -================== ================== ====================================== -Option Default Description ------------------- ------------------ -------------------------------------- -log_name account-replicator Label used when logging -log_facility LOG_LOCAL0 Syslog log facility -log_level INFO Logging level -per_diff 1000 -concurrency 8 Number of replication workers to spawn -run_pause 30 Time in seconds to wait between - replication passes -node_timeout 10 Request timeout to external services -conn_timeout 0.5 Connection timeout to external services -reclaim_age 604800 Time elapsed in seconds before an - account can be reclaimed -================== ================== ====================================== - -[account-auditor] - -==================== =============== ======================================= -Option Default Description --------------------- --------------- --------------------------------------- -log_name account-auditor Label used when logging -log_facility LOG_LOCAL0 Syslog log facility -log_level INFO Logging level -interval 1800 Minimum time for a pass to take -==================== =============== ======================================= - -[account-reaper] - -================== =============== ========================================= -Option Default Description ------------------- --------------- ----------------------------------------- -log_name account-auditor Label used when logging -log_facility LOG_LOCAL0 Syslog log facility -log_level INFO Logging level -concurrency 25 Number of replication workers to spawn -interval 3600 Minimum time for a pass to take -node_timeout 10 Request timeout to external services -conn_timeout 0.5 Connection timeout to external services -delay_reaping 0 Normally, the reaper begins deleting - account information for deleted accounts - immediately; you can set this to delay - its work however. The value is in seconds, - 2592000 = 30 days, for example. -================== =============== ========================================= - --------------------------- -Proxy Server Configuration --------------------------- - -An example Proxy Server configuration can be found at -etc/proxy-server.conf-sample in the source code repository. - -The following configuration options are available: - -[DEFAULT] - -============================ =============== ============================= -Option Default Description ----------------------------- --------------- ----------------------------- -bind_ip 0.0.0.0 IP Address for server to - bind to -bind_port 80 Port for server to bind to -bind_timeout 30 Seconds to attempt bind before - giving up -swift_dir /etc/swift Swift configuration directory -workers 1 Number of workers to fork -user swift User to run as -cert_file Path to the ssl .crt. This - should be enabled for testing - purposes only. -key_file Path to the ssl .key. This - should be enabled for testing - purposes only. -cors_allow_origin This is a list of hosts that - are included with any CORS - request by default and - returned with the - Access-Control-Allow-Origin - header in addition to what - the container has set. -log_custom_handlers None Comma separated list of functions - to call to setup custom log - handlers. 
-eventlet_debug false If true, turn on debug logging - for eventlet -============================ =============== ============================= - -[proxy-server] - -============================ =============== ============================= -Option Default Description ----------------------------- --------------- ----------------------------- -use Entry point for paste.deploy for - the proxy server. For most - cases, this should be - `egg:swift#proxy`. -set log_name proxy-server Label used when logging -set log_facility LOG_LOCAL0 Syslog log facility -set log_level INFO Log level -set log_headers True If True, log headers in each - request -set log_handoffs True If True, the proxy will log - whenever it has to failover to a - handoff node -recheck_account_existence 60 Cache timeout in seconds to - send memcached for account - existence -recheck_container_existence 60 Cache timeout in seconds to - send memcached for container - existence -object_chunk_size 65536 Chunk size to read from - object servers -client_chunk_size 65536 Chunk size to read from - clients -memcache_servers 127.0.0.1:11211 Comma separated list of - memcached servers ip:port -node_timeout 10 Request timeout to external - services -client_timeout 60 Timeout to read one chunk - from a client -conn_timeout 0.5 Connection timeout to - external services -error_suppression_interval 60 Time in seconds that must - elapse since the last error - for a node to be considered - no longer error limited -error_suppression_limit 10 Error count to consider a - node error limited -allow_account_management false Whether account PUTs and DELETEs - are even callable -object_post_as_copy true Set object_post_as_copy = false - to turn on fast posts where only - the metadata changes are stored - anew and the original data file - is kept in place. This makes for - quicker posts; but since the - container metadata isn't updated - in this mode, features like - container sync won't be able to - sync posts. -account_autocreate false If set to 'true' authorized - accounts that do not yet exist - within the Swift cluster will - be automatically created. -max_containers_per_account 0 If set to a positive value, - trying to create a container - when the account already has at - least this maximum containers - will result in a 403 Forbidden. - Note: This is a soft limit, - meaning a user might exceed the - cap for - recheck_account_existence before - the 403s kick in. -max_containers_whitelist This is a comma separated list - of account names that ignore - the max_containers_per_account - cap. -rate_limit_after_segment 10 Rate limit the download of - large object segments after - this segment is downloaded. -rate_limit_segments_per_sec 1 Rate limit large object - downloads at this rate. -============================ =============== ============================= - -[tempauth] - -===================== =============================== ======================= -Option Default Description ---------------------- ------------------------------- ----------------------- -use Entry point for - paste.deploy to use for - auth. To use tempauth - set to: - `egg:swift#tempauth` -set log_name tempauth Label used when logging -set log_facility LOG_LOCAL0 Syslog log facility -set log_level INFO Log level -set log_headers True If True, log headers in - each request -reseller_prefix AUTH The naming scope for the - auth service. Swift - storage accounts and - auth tokens will begin - with this prefix. -auth_prefix /auth/ The HTTP request path - prefix for the auth - service. 
Swift itself - reserves anything - beginning with the - letter `v`. -token_life 86400 The number of seconds a - token is valid. -storage_url_scheme default Scheme to return with - storage urls: http, - https, or default - (chooses based on what - the server is running - as) This can be useful - with an SSL load - balancer in front of a - non-SSL server. -===================== =============================== ======================= - -Additionally, you need to list all the accounts/users you want here. The format -is:: - - user__ = [group] [group] [...] [storage_url] - -or if you want to be able to include underscores in the ```` or -```` portions, you can base64 encode them (with *no* equal signs) in a -line like this:: - - user64__ = [group] [group] [...] [storage_url] - -There are special groups of:: - - .reseller_admin = can do anything to any account for this auth - .admin = can do anything within the account - -If neither of these groups are specified, the user can only access containers -that have been explicitly allowed for them by a .admin or .reseller_admin. - -The trailing optional storage_url allows you to specify an alternate url to -hand back to the user upon authentication. If not specified, this defaults to:: - - $HOST/v1/_ - -Where $HOST will do its best to resolve to what the requester would need to use -to reach this host, is from this section, and is -from the user__ name. Note that $HOST cannot possibly handle -when you have a load balancer in front of it that does https while TempAuth -itself runs with http; in such a case, you'll have to specify the -storage_url_scheme configuration value as an override. - -Here are example entries, required for running the tests:: - - user_admin_admin = admin .admin .reseller_admin - user_test_tester = testing .admin - user_test2_tester2 = testing2 .admin - user_test_tester3 = testing3 - - # account "test_y" and user "tester_y" (note the lack of padding = chars) - user64_dGVzdF95_dGVzdGVyX3k = testing4 .admin ------------------------ Memcached Considerations ------------------------ -Several of the Services rely on Memcached for caching certain types of -lookups, such as auth tokens, and container/account existence. Swift does -not do any caching of actual object data. Memcached should be able to run -on any servers that have available RAM and CPU. At Rackspace, we run -Memcached on the proxy servers. The `memcache_servers` config option -in the `proxy-server.conf` should contain all memcached servers. +Several of the Services rely on Memcached for caching certain types of lookups, +such as auth tokens, and container/account existence. Swift does not do any +caching of actual object data. Memcached should be able to run on any servers +that have available RAM and CPU. Typically Memcached is run on the proxy +servers. The ``memcache_servers`` config option in the ``proxy-server.conf`` +should contain all memcached servers. + +************************* +Shard Range Listing Cache +************************* + +When a container gets :ref:`sharded` the root container will still be the +primary entry point to many container requests, as it provides the list of shards. +To take load off the root container Swift by default caches the list of shards returned. + +As the number of shards for a root container grows to more than 3k the memcache default max +size of 1MB can be reached. 
+ +If you over-run your max configured memcache size, you'll see messages like:: + + Error setting value in memcached: 127.0.0.1:11211: SERVER_ERROR object too large for cache + +When you see these messages, your root containers are getting hammered and +probably returning 503 responses to clients. Override the default 1MB limit to +5MB with something like:: + + /usr/bin/memcached -I 5000000 ... + +Memcache has a ``stats sizes`` option that can point out the current size usage. As this +reaches the current max, an increase might be in order:: + + # telnet <memcached server> 11211 + > stats sizes + STAT 160 2 + STAT 448 1 + STAT 576 1 + END + ----------- System Time @@ -734,30 +529,58 @@ Time may be relative but it is relatively important for Swift! Swift uses timestamps to determine which is the most recent version of an object. It is very important for the system time on each server in the cluster to be synced as closely as possible (more so for the proxy server, but in general -it is a good idea for all the servers). At Rackspace, we use NTP with a local -NTP server to ensure that the system times are as close as possible. This -should also be monitored to ensure that the times do not vary too much. +it is a good idea for all the servers). Typical deployments use NTP with a +local NTP server to ensure that the system times are as close as possible. +This should also be monitored to ensure that the times do not vary too much. + +.. _general-service-tuning: ---------------------- General Service Tuning ---------------------- -Most services support either a worker or concurrency value in the settings. -This allows the services to make effective use of the cores available. A good -starting point to set the concurrency level for the proxy and storage services -to 2 times the number of cores available. If more than one service is -sharing a server, then some experimentation may be needed to find the best -balance. - -At Rackspace, our Proxy servers have dual quad core processors, giving us 8 -cores. Our testing has shown 16 workers to be a pretty good balance when -saturating a 10g network and gives good CPU utilization. - -Our Storage servers all run together on the same servers. These servers have -dual quad core processors, for 8 cores total. We run the Account, Container, -and Object servers with 8 workers each. Most of the background jobs are run -at a concurrency of 1, with the exception of the replicators which are run at -a concurrency of 2. +Most services support either a ``workers`` or ``concurrency`` value in the +settings. This allows the services to make effective use of the cores +available. A good starting point is to set the concurrency level for the proxy +and storage services to 2 times the number of cores available. If more than +one service is sharing a server, then some experimentation may be needed to +find the best balance. + +For example, one operator reported using the following settings in a production +Swift cluster: + +- Proxy servers have dual quad core processors (i.e. 8 cores); testing has + shown 16 workers to be a pretty good balance when saturating a 10g network + and gives good CPU utilization. + +- Storage server processes all run together on the same servers. These servers + have dual quad core processors, for 8 cores total. The Account, Container, + and Object servers are run with 8 workers each. Most of the background jobs + are run at a concurrency of 1, with the exception of the replicators which + are run at a concurrency of 2 (these settings are sketched as configuration + below). 
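Expressed as configuration, the example reported above might look like the following minimal sketch. The file and section names follow the sample configuration files shipped with Swift; the particular worker and concurrency values are simply the numbers quoted above for 8-core machines, not general recommendations::

    # proxy-server.conf on an 8-core proxy node (2 x cores)
    [DEFAULT]
    workers = 16

    # object-server.conf on an 8-core storage node
    [DEFAULT]
    workers = 8

    [object-replicator]
    concurrency = 2

The account-server.conf and container-server.conf on the same storage node would set ``workers = 8`` analogously, and experimentation as described above should guide any further tuning.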
+ +The ``max_clients`` parameter can be used to adjust the number of client +requests an individual worker accepts for processing. The fewer requests being +processed at one time, the less likely a request that consumes the worker's +CPU time, or blocks in the OS, will negatively impact other requests. The more +requests being processed at one time, the more likely one worker can utilize +network and disk capacity. + +On systems that have more cores, and more memory, where one can afford to run +more workers, raising the number of workers and lowering the maximum number of +clients serviced per worker can lessen the impact of CPU intensive or stalled +requests. + +The ``nice_priority`` parameter can be used to set program scheduling priority. +The ``ionice_class`` and ``ionice_priority`` parameters can be used to set I/O scheduling +class and priority on the systems that use an I/O scheduler that supports +I/O priorities. As at kernel 2.6.17 the only such scheduler is the Completely +Fair Queuing (CFQ) I/O scheduler. If you run your Storage servers all together +on the same servers, you can slow down the auditors or prioritize +object-server I/O via these parameters (but probably do not need to change +it on the proxy). It is a new feature and the best practices are still +being developed. On some systems it may be required to run the daemons as root. +For more info also see setpriority(2) and ioprio_set(2). The above configuration setting should be taken as suggestions and testing of configuration settings should be done to ensure best utilization of CPU, @@ -773,43 +596,69 @@ thorough testing with our use cases and hardware configurations, XFS was the best all-around choice. If you decide to use a filesystem other than XFS, we highly recommend thorough testing. -If you are using XFS, some settings that can dramatically impact -performance. We recommend the following when creating the XFS -partition:: +For distros with more recent kernels (for example Ubuntu 12.04 Precise), +we recommend using the default settings (including the default inode size +of 256 bytes) when creating the file system:: + + mkfs.xfs -L D1 /dev/sda1 + +In the last couple of years, XFS has made great improvements in how inodes +are allocated and used. Using the default inode size no longer has an +impact on performance. + +For distros with older kernels (for example Ubuntu 10.04 Lucid), +some settings can dramatically impact performance. We recommend the +following when creating the file system:: - mkfs.xfs -i size=1024 -f /dev/sda1 + mkfs.xfs -i size=1024 -L D1 /dev/sda1 Setting the inode size is important, as XFS stores xattr data in the inode. If the metadata is too large to fit in the inode, a new extent is created, which can cause quite a performance problem. Upping the inode size to 1024 bytes provides enough room to write the default metadata, plus a little -headroom. We do not recommend running Swift on RAID, but if you are using -RAID it is also important to make sure that the proper sunit and swidth -settings get set so that XFS can make most efficient use of the RAID array. +headroom. 
-We also recommend the following example mount options when using XFS:: +The following example mount options are recommended when using XFS:: - mount -t xfs -o noatime,nodiratime,nobarrier,logbufs=8 /dev/sda1 /srv/node/sda + mount -t xfs -o noatime -L D1 /srv/node/d1 -For a standard swift install, all data drives are mounted directly under -/srv/node (as can be seen in the above example of mounting /def/sda1 as -/srv/node/sda). If you choose to mount the drives in another directory, -be sure to set the `devices` config option in all of the server configs to +We do not recommend running Swift on RAID, but if you are using +RAID it is also important to make sure that the proper sunit and swidth +settings get set so that XFS can make most efficient use of the RAID array. + +For a standard Swift install, all data drives are mounted directly under +``/srv/node`` (as can be seen in the above example of mounting label ``D1`` +as ``/srv/node/d1``). If you choose to mount the drives in another directory, +be sure to set the ``devices`` config option in all of the server configs to point to the correct directory. +The mount points for each drive in ``/srv/node/`` should be owned by the root user +almost exclusively (``root:root 755``). This is required to prevent rsync from +syncing files into the root drive in the event a drive is unmounted. + Swift uses system calls to reserve space for new objects being written into -the system. If your filesystem does not support `fallocate()` or -`posix_fallocate()`, be sure to set the `disable_fallocate = true` config +the system. If your filesystem does not support ``fallocate()`` or +``posix_fallocate()``, be sure to set the ``disable_fallocate = true`` config parameter in account, container, and object server configs. +Most current Linux distributions ship with a default installation of updatedb. +This tool runs periodically and updates the file name database that is used by +the GNU locate tool. However, including Swift object and container database +files is most likely not required and the periodic update affects the +performance quite a bit. To disable the inclusion of these files add the path +where Swift stores its data to the setting PRUNEPATHS in ``/etc/updatedb.conf``:: + + PRUNEPATHS="... /tmp ... /var/spool ... /srv/node" + + --------------------- General System Tuning --------------------- -Rackspace currently runs Swift on Ubuntu Server 10.04, and the following -changes have been found to be useful for our use cases. +The following changes have been found to be useful when running Swift on Ubuntu +Server 10.04. -The following settings should be in `/etc/sysctl.conf`:: +The following settings should be in ``/etc/sysctl.conf``:: # disable TIME_WAIT.. wait.. net.ipv4.tcp_tw_recycle=1 @@ -819,9 +668,9 @@ The following settings should be in `/etc/sysctl.conf`:: net.ipv4.tcp_syncookies = 0 # double amount of allowed conntrack - net.ipv4.netfilter.ip_conntrack_max = 262144 + net.netfilter.nf_conntrack_max = 262144 -To load the updated sysctl settings, run ``sudo sysctl -p`` +To load the updated sysctl settings, run ``sudo sysctl -p``. A note about changing the TIME_WAIT values. By default the OS will hold a port open for 60 seconds to ensure that any remaining packets can be @@ -835,7 +684,7 @@ Logging Considerations ---------------------- Swift is set up to log directly to syslog. Every service can be configured -with the `log_facility` option to set the syslog log facility destination. 
+with the ``log_facility`` option to set the syslog log facility destination. We recommended using syslog-ng to route the logs to specific log files locally on the server and also to remote log collecting servers. Additionally, custom log handlers can be used via the custom_log_handlers diff --git a/doc/source/development_auth.rst b/doc/source/development_auth.rst index e913850b5a..53c50b6743 100644 --- a/doc/source/development_auth.rst +++ b/doc/source/development_auth.rst @@ -37,7 +37,7 @@ will be omitted. It is highly recommended that authentication server implementers prefix their tokens and Swift storage accounts they create with a configurable reseller -prefix (`AUTH_` by default with the included TempAuth). This prefix will avoid +prefix (``AUTH_`` by default with the included TempAuth). This prefix will avoid conflicts with other authentication servers that might be using the same Swift cluster. Otherwise, the Swift cluster will have to try all the resellers until one validates a token or all fail. @@ -48,18 +48,18 @@ designations as you'll see later). Example Authentication with TempAuth: - * Token AUTH_tkabcd is given to the TempAuth middleware in a request's - X-Auth-Token header. - * The TempAuth middleware validates the token AUTH_tkabcd and discovers - it matches the "tester" user within the "test" account for the storage - account "AUTH_storage_xyz". - * The TempAuth middleware sets the REMOTE_USER to - "test:tester,test,AUTH_storage_xyz" - * Now this user will have full access (via authorization procedures later) - to the AUTH_storage_xyz Swift storage account and access to containers in - other storage accounts, provided the storage account begins with the same - `AUTH_` reseller prefix and the container has an ACL specifying at least - one of those three groups. +* Token AUTH_tkabcd is given to the TempAuth middleware in a request's + X-Auth-Token header. +* The TempAuth middleware validates the token AUTH_tkabcd and discovers + it matches the "tester" user within the "test" account for the storage + account "AUTH_storage_xyz". +* The TempAuth middleware sets the REMOTE_USER to + "test:tester,test,AUTH_storage_xyz" +* Now this user will have full access (via authorization procedures later) + to the AUTH_storage_xyz Swift storage account and access to containers in + other storage accounts, provided the storage account begins with the same + ``AUTH_`` reseller prefix and the container has an ACL specifying at least + one of those three groups. Authorization is performed through callbacks by the Swift Proxy server to the WSGI environment's swift.authorize value, if one is set. 
The swift.authorize @@ -352,7 +352,7 @@ folks a start on their own code if they want to use repoze.what:: self.ssl = \ conf.get('ssl', 'false').lower() in ('true', 'on', '1', 'yes') self.auth_prefix = conf.get('prefix', '/') - self.timeout = int(conf.get('node_timeout', 10)) + self.timeout = float(conf.get('node_timeout', 10)) def authenticate(self, env, identity): token = identity.get('token') @@ -375,7 +375,7 @@ folks a start on their own code if they want to use repoze.what:: expiration = float(resp.getheader('x-auth-ttl')) user = resp.getheader('x-auth-user') memcache_client.set(key, (time(), expiration, user), - timeout=expiration) + time=expiration) return user return None @@ -487,7 +487,8 @@ folks a start on their own code if they want to use repoze.what:: Allowing CORS with Auth ----------------------- -Cross Origin RequestS require that the auth system allow the OPTIONS method to -pass through without a token. The preflight request will make an OPTIONS call -against the object or container and will not work if the auth system stops it. +Cross Origin Resource Sharing (CORS) require that the auth system allow the +OPTIONS method to pass through without a token. The preflight request will +make an OPTIONS call against the object or container and will not work if +the auth system stops it. See TempAuth for an example of how OPTIONS requests are handled. diff --git a/doc/source/development_guidelines.rst b/doc/source/development_guidelines.rst index 5682233bfc..6af3e49513 100644 --- a/doc/source/development_guidelines.rst +++ b/doc/source/development_guidelines.rst @@ -6,65 +6,301 @@ Development Guidelines Coding Guidelines ----------------- -For the most part we try to follow PEP 8 guidelines which can be viewed +For the most part we try to follow PEP 8 guidelines which can be viewed here: http://www.python.org/dev/peps/pep-0008/ -There is a useful pep8 command line tool for checking files for pep8 -compliance which can be installed with ``easy_install pep8``. - ------------------ Testing Guidelines ------------------ -Swift has a comprehensive suite of tests that are run on all submitted code, -and it is recommended that developers execute the tests themselves to -catch regressions early. Developers are also expected to keep the -test suite up-to-date with any submitted code changes. +Swift has a comprehensive suite of tests and pep8 checks that are run on all +submitted code, and it is recommended that developers execute the tests +themselves to catch regressions early. Developers are also expected to keep +the test suite up-to-date with any submitted code changes. + +Swift's tests and pep8 checks can be executed in an isolated environment +with ``tox``: http://tox.testrun.org/ + +To execute the tests: + +* Ensure ``pip`` and ``virtualenv`` are upgraded to satisfy the version + requirements listed in the OpenStack `global requirements`_:: + + pip install pip -U + pip install virtualenv -U + +.. _`global requirements`: https://github.com/openstack/requirements/blob/master/global-requirements.txt + +* Install ``tox``:: + + pip install tox + +* Generate list of distribution packages to install for testing:: + + tox -e bindep + + Now install these packages using your distribution package manager + like apt-get, dnf, yum, or zypper. + +* Run ``tox`` from the root of the swift repo:: + + tox + +To run a selected subset of unit tests with ``pytest``: + +* Create a virtual environment with ``tox``:: + + tox devenv -e py3 .env + +.. 
note:: + Alternatively, here are the steps of manual preparation of the virtual environment:: + + virtualenv .env + source .env/bin/activate + pip3 install -r requirements.txt -r test-requirements.txt -c py36-constraints.txt + pip3 install -e . + deactivate + +* Activate the virtual environment:: + + source .env/bin/activate + +* Run some unit tests, for example:: + + pytest test/unit/common/middleware/crypto + +* Run all unit tests:: + + pytest test/unit + +.. note:: + If you installed using ``cd ~/swift; sudo python setup.py develop``, you may + need to do ``cd ~/swift; sudo chown -R ${USER}:${USER} swift.egg-info`` prior + to running ``tox``. + +* By default ``tox`` will run **all of the unit test** and pep8 checks listed in + the ``tox.ini`` file ``envlist`` option. A subset of the test environments + can be specified on the ``tox`` command line or by setting the ``TOXENV`` + environment variable. For example, to run only the pep8 checks and python3 + unit tests use:: + + tox -e pep8,py3 + + or:: + + TOXENV=py3,pep8 tox + + To run unit tests with python3.12 specifically:: + + tox -e py312 + +.. note:: + As of ``tox`` version 2.0.0, most environment variables are not automatically + passed to the test environment. Swift's ``tox.ini`` overrides this default + behavior so that variable names matching ``SWIFT_*`` and ``*_proxy`` will be + passed, but you may need to run ``tox --recreate`` for this to take effect + after upgrading from ``tox`` <2.0.0. + + Conversely, if you do not want those environment variables to be passed to + the test environment then you will need to unset them before calling ``tox``. + + Also, if you ever encounter DistributionNotFound, try to use ``tox + --recreate`` or remove the ``.tox`` directory to force ``tox`` to recreate the + dependency list. + + Swift's tests require having an XFS directory available in ``/tmp`` or + in the ``TMPDIR`` environment variable. + +Swift's functional tests may be executed against a :doc:`development_saio` or +other running Swift cluster using the command:: + + tox -e func + +The endpoint and authorization credentials to be used by functional tests +should be configured in the ``test.conf`` file as described in the section +:ref:`setup_scripts`. + +The environment variable ``SWIFT_TEST_POLICY`` may be set to specify a +particular storage policy *name* that will be used for testing. When set, tests +that would otherwise not specify a policy or choose a random policy from +those available will instead use the policy specified. Tests that use more than +one policy will include the specified policy in the set of policies used. The +specified policy must be available on the cluster under test. -Swift's suite of unit tests can be executed in an isolated environment -with Tox: http://tox.testrun.org/ +For example, this command would run the functional tests using policy +'silver':: -To execute the unit tests: + SWIFT_TEST_POLICY=silver tox -e func -* Install Tox: +To run a single functional test, use the ``--no-discover`` option together with +a path to a specific test method, for example:: - - `pip install tox` + tox -e func -- --no-discover test.functional.tests.TestFile.testCopy -* Run Tox from the root of the swift repo: - - `tox` +In-process functional testing +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -* Optionally, run only specific tox builds: +If the ``test.conf`` file is not found then the functional test framework will +instantiate a set of Swift servers in the same process that executes the +functional tests. 
This 'in-process test' mode may also be enabled (or disabled) +by setting the environment variable ``SWIFT_TEST_IN_PROCESS`` to a true (or +false) value prior to executing ``tox -e func``. - - `tox -e pep8,py26` +When using the 'in-process test' mode some server configuration options may be +set using environment variables: + +- the optional in-memory object server may be selected by setting the + environment variable ``SWIFT_TEST_IN_MEMORY_OBJ`` to a true value. + +- encryption may be added to the proxy pipeline by setting the + environment variable ``SWIFT_TEST_IN_PROCESS_CONF_LOADER`` to + ``encryption``. + +- a 2+1 EC policy may be installed as the default policy by setting the + environment variable ``SWIFT_TEST_IN_PROCESS_CONF_LOADER`` to + ``ec``. + +- logging to stdout may be enabled by setting ``SWIFT_TEST_DEBUG_LOGS``. + +For example, this command would run the in-process mode functional tests with +encryption enabled in the proxy-server:: + + SWIFT_TEST_IN_PROCESS=1 SWIFT_TEST_IN_PROCESS_CONF_LOADER=encryption \ + tox -e func + +This particular example may also be run using the ``func-encryption`` +tox environment:: + + tox -e func-encryption + +The ``tox.ini`` file also specifies test environments for running other +in-process functional test configurations, e.g.:: + + tox -e func-ec + +To debug the functional tests, use the 'in-process test' mode and pass the +``--pdb`` flag to ``tox``:: + + SWIFT_TEST_IN_PROCESS=1 tox -e func -- --pdb \ + test.functional.tests.TestFile.testCopy + +The 'in-process test' mode searches for ``proxy-server.conf`` and +``swift.conf`` config files from which it copies config options and overrides +some options to suit in process testing. The search will first look for config +files in a ```` that may optionally be specified using +the environment variable:: + + SWIFT_TEST_IN_PROCESS_CONF_DIR= + +If ``SWIFT_TEST_IN_PROCESS_CONF_DIR`` is not set, or if a config file is not +found in ````, the search will then look in the +``etc/`` directory in the source tree. If the config file is still not found, +the corresponding sample config file from ``etc/`` is used (e.g. +``proxy-server.conf-sample`` or ``swift.conf-sample``). + +When using the 'in-process test' mode ``SWIFT_TEST_POLICY`` may be set to +specify a particular storage policy *name* that will be used for testing as +described above. When set, this policy must exist in the ``swift.conf`` file +and its corresponding ring file must exist in ```` (if +specified) or ``etc/``. The test setup will set the specified policy to be the +default and use its ring file properties for constructing the test object ring. +This allows in-process testing to be run against various policy types and ring +files. + +For example, this command would run the in-process mode functional tests +using config files found in ``$HOME/my_tests`` and policy 'silver':: + + SWIFT_TEST_IN_PROCESS=1 SWIFT_TEST_IN_PROCESS_CONF_DIR=$HOME/my_tests \ + SWIFT_TEST_POLICY=silver tox -e func + + +S3 API cross-compatibility tests +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +The cross-compatibility tests in directory `test/s3api` are intended to verify +that the Swift S3 API behaves in the same way as the AWS S3 API. They should +pass when run against either a Swift endpoint (with S3 API enabled) or an AWS +S3 endpoint. + +To run against an AWS S3 endpoint, the `/etc/swift/test.conf` file must be +edited to provide AWS key IDs and secrets. 
Alternatively, an AWS CLI style +credentials file can be loaded by setting the ``SWIFT_TEST_AWS_CONFIG_FILE`` +environment variable, e.g.:: + + SWIFT_TEST_AWS_CONFIG_FILE=~/.aws/credentials pytest ./test/s3api + +.. note:: + When using ``SWIFT_TEST_AWS_CONFIG_FILE``, the region defaults to + ``us-east-1`` and only the default credentials are loaded. + + +------------ +Coding Style +------------ + +Swift uses flake8 with the OpenStack `hacking`_ module to enforce +coding style. + +Install flake8 and hacking with pip or by the packages of your +Operating System. + +It is advised to integrate flake8+hacking with your editor to get it +automated and not get `caught` by Jenkins. + +For example for Vim the `syntastic`_ plugin can do this for you. + +.. _`hacking`: https://pypi.org/project/hacking +.. _`syntastic`: https://github.com/scrooloose/syntastic ------------------------ Documentation Guidelines ------------------------ -The documentation in docstrings should follow the PEP 257 conventions +The documentation in docstrings should follow the PEP 257 conventions (as mentioned in the PEP 8 guidelines). More specifically: - 1. Triple qutes should be used for all docstrings. - 2. If the docstring is simple and fits on one line, then just use - one line. - 3. For docstrings that take multiple lines, there should be a newline - after the opening quotes, and before the closing quotes. - 4. Sphinx is used to build documentation, so use the restructured text - markup to designate parameters, return values, etc. Documentation on - the sphinx specific markup can be found here: - http://sphinx.pocoo.org/markup/index.html +#. Triple quotes should be used for all docstrings. +#. If the docstring is simple and fits on one line, then just use + one line. +#. For docstrings that take multiple lines, there should be a newline + after the opening quotes, and before the closing quotes. +#. Sphinx is used to build documentation, so use the restructured text + markup to designate parameters, return values, etc. Documentation on + the sphinx specific markup can be found here: + https://www.sphinx-doc.org/en/master/ + +To build documentation run:: + + pip install -r requirements.txt -r doc/requirements.txt + sphinx-build -W -b html doc/source doc/build/html + +and then browse to doc/build/html/index.html. These docs are auto-generated +after every commit and available online at +https://docs.openstack.org/swift/latest/. + +-------- +Manpages +-------- + +For sanity check of your change in manpage, use this command in the root +of your Swift repo:: + + ./.manpages --------------------- License and Copyright --------------------- -Every source file should have the following copyright and license statement at -the top:: +You can have the following copyright and license statement at +the top of each source file. Copyright assignment is optional. + +New files should contain the current year. Substantial updates can have +another year added, and date ranges are not needed.:: - # Copyright (c) 2010-2012 OpenStack, LLC. + # Copyright (c) 2013 OpenStack Foundation. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. 
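
As an illustration of the docstring conventions listed above (items 3 and 4
in particular), a hypothetical helper might be documented like this, with a
newline after the opening quotes and Sphinx field markup for parameters,
return values and exceptions::

    def put_object(path, body, timeout=10.0):
        """
        Store an object at the given path.

        :param path: full object path of the form /account/container/object
        :param body: bytes to store
        :param timeout: seconds to wait for the back end to respond
        :returns: the MD5 etag of the stored data
        :raises ValueError: if ``path`` is malformed
        """
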
diff --git a/doc/source/development_middleware.rst b/doc/source/development_middleware.rst new file mode 100644 index 0000000000..41e6ace20c --- /dev/null +++ b/doc/source/development_middleware.rst @@ -0,0 +1,383 @@ +======================= +Middleware and Metadata +======================= + +---------------- +Using Middleware +---------------- + +`Python WSGI Middleware`_ (or just "middleware") can be used to "wrap" +the request and response of a Python WSGI application (i.e. a webapp, +or REST/HTTP API), like Swift's WSGI servers (proxy-server, +account-server, container-server, object-server). Swift uses middleware +to add (sometimes optional) behaviors to the Swift WSGI servers. + +.. _Python WSGI Middleware: http://www.python.org/dev/peps/pep-0333/#middleware-components-that-play-both-sides + +Middleware can be added to the Swift WSGI servers by modifying their +`paste`_ configuration file. The majority of Swift middleware is applied +to the :ref:`proxy-server`. + +.. _paste: https://pypi.org/project/Paste/ + +Given the following basic configuration:: + + [DEFAULT] + log_level = DEBUG + user = + + [pipeline:main] + pipeline = proxy-server + + [app:proxy-server] + use = egg:swift#proxy + +You could add the :ref:`healthcheck` middleware by adding a section for +that filter and adding it to the pipeline:: + + [DEFAULT] + log_level = DEBUG + user = + + [pipeline:main] + pipeline = healthcheck proxy-server + + [filter:healthcheck] + use = egg:swift#healthcheck + + [app:proxy-server] + use = egg:swift#proxy + + +Some middleware is required and will be inserted into your pipeline +automatically by core swift code (e.g. the proxy-server will insert +:ref:`catch_errors` and :ref:`gatekeeper` at the start of the pipeline if they +are not already present). You can see which features are available on a given +Swift endpoint (including middleware) using the :ref:`discoverability` +interface. + + +---------------------------- +Creating Your Own Middleware +---------------------------- + +The best way to see how to write middleware is to look at examples. + +Many optional features in Swift are implemented as +:ref:`common_middleware` and provided in ``swift.common.middleware``, but +Swift middleware may be packaged and distributed as a separate project. +Some examples are listed on the :ref:`associated_projects` page. + +A contrived middleware example that modifies request behavior by +inspecting custom HTTP headers (e.g. 
X-Webhook) and uses :ref:`sysmeta` +to persist data to backend storage as well as common patterns like a +:func:`.get_container_info` cache/query and :func:`.wsgify` decorator is +presented below:: + + from swift.common.http import is_success + from swift.common.swob import wsgify + from swift.common.utils import split_path, get_logger + from swift.common.request_helpers import get_sys_meta_prefix + from swift.proxy.controllers.base import get_container_info + from eventlet import Timeout + from eventlet.green.urllib import urllib_request + + # x-container-sysmeta-webhook + SYSMETA_WEBHOOK = get_sys_meta_prefix('container') + 'webhook' + + + class WebhookMiddleware(object): + def __init__(self, app, conf): + self.app = app + self.logger = get_logger(conf, log_route='webhook') + + @wsgify + def __call__(self, req): + obj = None + try: + (version, account, container, obj) = \ + split_path(req.path_info, 4, 4, True) + except ValueError: + # not an object request + pass + if 'x-webhook' in req.headers: + # translate user's request header to sysmeta + req.headers[SYSMETA_WEBHOOK] = \ + req.headers['x-webhook'] + if 'x-remove-webhook' in req.headers: + # empty value will tombstone sysmeta + req.headers[SYSMETA_WEBHOOK] = '' + # account and object storage will ignore x-container-sysmeta-* + resp = req.get_response(self.app) + if obj and is_success(resp.status_int) and req.method == 'PUT': + container_info = get_container_info(req.environ, self.app) + # container_info may have our new sysmeta key + webhook = container_info['sysmeta'].get('webhook') + if webhook: + # create a POST request with obj name as body + webhook_req = urllib_request.Request(webhook, data=obj) + with Timeout(20): + try: + urllib_request.urlopen(webhook_req).read() + except (Exception, Timeout): + self.logger.exception( + 'failed POST to webhook %s' % webhook) + else: + self.logger.info( + 'successfully called webhook %s' % webhook) + if 'x-container-sysmeta-webhook' in resp.headers: + # translate sysmeta from the backend resp to + # user-visible client resp header + resp.headers['x-webhook'] = resp.headers[SYSMETA_WEBHOOK] + return resp + + + def webhook_factory(global_conf, **local_conf): + conf = global_conf.copy() + conf.update(local_conf) + + def webhook_filter(app): + return WebhookMiddleware(app, conf) + return webhook_filter + +In practice this middleware will call the URL stored on the container as +X-Webhook on all successful object uploads. + +If this example was at ``/swift/common/middleware/webhook.py`` - +you could add it to your proxy by creating a new filter section and +adding it to the pipeline:: + + [DEFAULT] + log_level = DEBUG + user = + + [pipeline:main] + pipeline = healthcheck webhook proxy-server + + [filter:webhook] + paste.filter_factory = swift.common.middleware.webhook:webhook_factory + + [filter:healthcheck] + use = egg:swift#healthcheck + + [app:proxy-server] + use = egg:swift#proxy + +Most python packages expose middleware as entrypoints. See `PasteDeploy`_ +documentation for more information about the syntax of the ``use`` option. +All middleware included with Swift is installed to support the ``egg:swift`` +syntax. + +.. 
_PasteDeploy: https://pypi.org/project/PasteDeploy/ + +Middleware may advertize its availability and capabilities via Swift's +:ref:`discoverability` support by using +:func:`.register_swift_info`:: + + from swift.common.registry import register_swift_info + def webhook_factory(global_conf, **local_conf): + register_swift_info('webhook') + def webhook_filter(app): + return WebhookMiddleware(app) + return webhook_filter + +If a middleware handles sensitive information in headers or query parameters +that may need redaction when logging, use the :func:`.register_sensitive_header` +and :func:`.register_sensitive_param` functions. This should be done in the +filter factory:: + + from swift.common.registry import register_sensitive_header + def webhook_factory(global_conf, **local_conf): + register_sensitive_header('webhook-api-key') + def webhook_filter(app): + return WebhookMiddleware(app) + return webhook_filter + + +Middlewares can override the status integer that is logged by proxy_logging +middleware by setting ``swift.proxy_logging_status`` in the request WSGI +environment. The value should be an integer. The value will replace the default +status integer in the log message, unless the proxy_logging middleware detects +a client disconnect or exception while handling the request, in which case +``swift.proxy_logging_status`` is overridden by a 499 or 500 respectively. + +-------------- +Swift Metadata +-------------- + +Generally speaking metadata is information about a resource that is +associated with the resource but is not the data contained in the +resource itself - which is set and retrieved via HTTP headers. (e.g. the +"Content-Type" of a Swift object that is returned in HTTP response +headers) + +All user resources in Swift (i.e. account, container, objects) can have +user metadata associated with them. Middleware may also persist custom +metadata to accounts and containers safely using System Metadata. Some +core Swift features which predate sysmeta have added exceptions for +custom non-user metadata headers (e.g. :ref:`acls`, +:ref:`large-objects`) + +.. _usermeta: + +^^^^^^^^^^^^^ +User Metadata +^^^^^^^^^^^^^ + +User metadata takes the form of ``X--Meta-: ``, where +```` depends on the resources type (i.e. Account, Container, Object) +and ```` and ```` are set by the client. + +User metadata should generally be reserved for use by the client or +client applications. A perfect example use-case for user metadata is +`python-swiftclient`_'s ``X-Object-Meta-Mtime`` which it stores on +object it uploads to implement its ``--changed`` option which will only +upload files that have changed since the last upload. + +.. _python-swiftclient: https://opendev.org/openstack/python-swiftclient + +New middleware should avoid storing metadata within the User Metadata +namespace to avoid potential conflict with existing user metadata when +introducing new metadata keys. An example of legacy middleware that +borrows the user metadata namespace is :ref:`tempurl`. An example of +middleware which uses custom non-user metadata to avoid the user +metadata namespace is :ref:`slo-doc`. + +User metadata that is stored by a PUT or POST request to a container or account +resource persists until it is explicitly removed by a subsequent PUT or POST +request that includes a header ``X--Meta-`` with no value or a +header ``X-Remove--Meta-: ``. In the latter case the +```` is not stored. All user metadata stored with an account or +container resource is deleted when the account or container is deleted. 
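
As a concrete illustration of these update and removal semantics, the
following sketch uses python-swiftclient against a hypothetical SAIO-style
endpoint with TempAuth credentials (adjust the auth URL, user and key for
your own cluster)::

    from swiftclient.client import Connection

    conn = Connection(authurl='http://127.0.0.1:8080/auth/v1.0',
                      user='test:tester', key='testing')

    conn.put_container('photos')

    # Set one item of user metadata on the container.
    conn.post_container('photos', {'X-Container-Meta-Owner': 'alice'})
    print(conn.head_container('photos').get('x-container-meta-owner'))

    # Either an empty value or the X-Remove-* form deletes the item;
    # other existing metadata items on the container are left untouched.
    conn.post_container('photos', {'X-Remove-Container-Meta-Owner': 'yes'})
    print(conn.head_container('photos').get('x-container-meta-owner'))
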
+ +User metadata that is stored with an object resource has a different semantic; +object user metadata persists until any subsequent PUT or POST request is made +to the same object, at which point all user metadata stored with that object is +deleted en-masse and replaced with any user metadata included with the PUT or +POST request. As a result, it is not possible to update a subset of the user +metadata items stored with an object while leaving some items unchanged. + +.. _sysmeta: + +^^^^^^^^^^^^^^^^^^^^^^^^^ +System Metadata (Sysmeta) +^^^^^^^^^^^^^^^^^^^^^^^^^ + +System metadata takes the form of ``X--Sysmeta-: ``, +where ```` depends on the resources type (i.e. Account, Container, +Object) and ```` and ```` are set by trusted code running in a +Swift WSGI Server. + +All headers on client requests in the form of ``X--Sysmeta-`` +will be dropped from the request before being processed by any +middleware. All headers on responses from back-end systems in the form +of ``X--Sysmeta-`` will be removed after all middlewares have +processed the response but before the response is sent to the client. +See :ref:`gatekeeper` middleware for more information. + +System metadata provides a means to store potentially private custom +metadata with associated Swift resources in a safe and secure fashion +without actually having to plumb custom metadata through the core swift +servers. The incoming filtering ensures that the namespace can not be +modified directly by client requests, and the outgoing filter ensures +that removing middleware that uses a specific system metadata key +renders it benign. New middleware should take advantage of system +metadata. + +System metadata may be set on accounts and containers by including headers with +a PUT or POST request. Where a header name matches the name of an existing item +of system metadata, the value of the existing item will be updated. Otherwise +existing items are preserved. A system metadata header with an empty value will +cause any existing item with the same name to be deleted. + +System metadata may be set on objects using only PUT requests. All items of +existing system metadata will be deleted and replaced en-masse by any system +metadata headers included with the PUT request. System metadata is neither +updated nor deleted by a POST request: updating individual items of system +metadata with a POST request is not yet supported in the same way that updating +individual items of user metadata is not supported. In cases where middleware +needs to store its own metadata with a POST request, it may use Object Transient +Sysmeta. + + +^^^^^^^^^^^^^^^ +Object Metadata +^^^^^^^^^^^^^^^ + +Objects have other metadata in addition to the user metadata and system +metadata described above. + +****************** +Immutable Metadata +****************** + +Objects have several items of immutable metadata. Like system metadata, these +may only be set using PUT requests. However, they do not follow the general +``X-Object-Sysmeta-`` naming scheme and they are not automatically removed +from client responses. + +Object immutable metadata includes:: + + X-Timestamp + Content-Length + Etag + +``X-Timestamp`` and ``Content-Length`` metadata MUST be included in PUT +requests to object servers. ``Etag`` metadata is generated by object servers +when they handle a PUT request, but checked against any ``Etag`` header sent +with the PUT request. 
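
The ``Etag`` check described above can be exercised from the client side: if
a PUT includes an ETag header, the object server compares it against the MD5
of the bytes it actually received. A minimal sketch with python-swiftclient,
reusing the hypothetical container and credentials from the earlier example::

    from hashlib import md5
    from swiftclient.client import Connection

    conn = Connection(authurl='http://127.0.0.1:8080/auth/v1.0',
                      user='test:tester', key='testing')

    body = b'some object data'
    # Sending the MD5 hex digest lets the object server verify the upload;
    # a mismatch makes the PUT fail (typically 422 Unprocessable Entity).
    etag = conn.put_object('photos', 'obj1', contents=body,
                           etag=md5(body).hexdigest())
    print(etag)  # the Etag that is now stored as immutable metadata
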
+ +Object immutable metadata, along with ``Content-Type``, is the only object +metadata that is stored by container servers and returned in object listings. + +************ +Content-Type +************ + +Object ``Content-Type`` metadata is treated differently from immutable +metadata, system metadata and user metadata. + +``Content-Type`` MUST be included in PUT requests to object servers. Unlike +immutable metadata or system metadata, ``Content-Type`` is mutable and may be +included in POST requests to object servers. However, unlike object user +metadata, existing ``Content-Type`` metadata persists if a POST request does +not include new ``Content-Type`` metadata. This is because an object must have +``Content-Type`` metadata, which is also stored by container servers and +returned in object listings. + +``Content-Type`` is the only item of object metadata that is both mutable and +yet also persists when not specified in a POST request. + +.. _transient_sysmeta: + +************************ +Object Transient-Sysmeta +************************ + +If middleware needs to store object metadata with a POST request it may do so +using headers of the form ``X-Object-Transient-Sysmeta-: ``. + +All headers on client requests in the form of +``X-Object-Transient-Sysmeta-`` will be dropped from the request before +being processed by any middleware. All headers on responses from back-end +systems in the form of ``X-Object-Transient-Sysmeta-`` will be removed +after all middlewares have processed the response but before the response is +sent to the client. See :ref:`gatekeeper` middleware for more information. + +Transient-sysmeta updates on an object have the same semantic as user +metadata updates on an object (see :ref:`usermeta`) i.e. whenever any PUT or +POST request is made to an object, all existing items of transient-sysmeta are +deleted en-masse and replaced with any transient-sysmeta included with the PUT +or POST request. Transient-sysmeta set by a middleware is therefore prone to +deletion by a subsequent client-generated POST request unless the middleware is +careful to include its transient-sysmeta with every POST. Likewise, user +metadata set by a client is prone to deletion by a subsequent +middleware-generated POST request, and for that reason middleware should avoid +generating POST requests that are independent of any client request. + +Transient-sysmeta deliberately uses a different header prefix to user metadata +so that middlewares can avoid potential conflict with user metadata keys. + +Transient-sysmeta deliberately uses a different header prefix to system +metadata to emphasize the fact that the data is only persisted until a +subsequent POST. diff --git a/doc/source/development_ondisk_backends.rst b/doc/source/development_ondisk_backends.rst new file mode 100644 index 0000000000..14934d7b6c --- /dev/null +++ b/doc/source/development_ondisk_backends.rst @@ -0,0 +1,39 @@ +=============================== +Pluggable On-Disk Back-end APIs +=============================== + +The internal REST API used between the proxy server and the account, container +and object server is almost identical to public Swift REST API, but with a few +internal extensions (for example, update an account with a new container). + +The pluggable back-end APIs for the three REST API servers (account, +container, object) abstracts the needs for servicing the various REST APIs +from the details of how data is laid out and stored on-disk. 
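
To make that separation concrete, here is a deliberately simplified sketch of
the idea; it is *not* the real ``swift.obj.diskfile`` interface, only an
illustration of how a REST-facing server can be written against a small
back-end API while the storage layout (here: an in-memory dict) stays hidden
behind it::

    class InMemoryDiskFile(object):
        """Toy back end that keeps object data and metadata in a dict."""

        _store = {}

        def __init__(self, account, container, obj):
            self.key = (account, container, obj)

        def write(self, body, metadata):
            self._store[self.key] = (body, dict(metadata))

        def read(self):
            return self._store[self.key]


    # A server written against this API never needs to know how or where
    # the data is actually kept.
    df = InMemoryDiskFile('AUTH_test', 'photos', 'obj1')
    df.write(b'data', {'Content-Type': 'text/plain'})
    print(df.read())
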
+ +The APIs are documented in the reference implementations for all three +servers. For historical reasons, the object server backend reference +implementation module is named ``diskfile``, while the account and container +server backend reference implementation modules are named appropriately. + +This API is still under development and not yet finalized. + +----------------------------------------- +Back-end API for Account Server REST APIs +----------------------------------------- +.. automodule:: swift.account.backend + :noindex: + :members: + +------------------------------------------- +Back-end API for Container Server REST APIs +------------------------------------------- +.. automodule:: swift.container.backend + :noindex: + :members: + +---------------------------------------- +Back-end API for Object Server REST APIs +---------------------------------------- +.. automodule:: swift.obj.diskfile + :noindex: + :members: diff --git a/doc/source/development_saio.rst b/doc/source/development_saio.rst old mode 100755 new mode 100644 index 18de01c105..a9f1e6fffe --- a/doc/source/development_saio.rst +++ b/doc/source/development_saio.rst @@ -1,56 +1,115 @@ +.. _saio: + ======================= -SAIO - Swift All In One +SAIO (Swift All In One) ======================= +.. note:: + This guide assumes an existing Linux server. A physical machine or VM will + work. We recommend configuring it with at least 2GB of memory and 40GB of + storage space. We recommend using a VM in order to isolate Swift and its + dependencies from other projects you may be working on. + --------------------------------------------- Instructions for setting up a development VM --------------------------------------------- -This section documents setting up a virtual machine for doing Swift development. -The virtual machine will emulate running a four node Swift cluster. +This section documents setting up a virtual machine for doing Swift +development. The virtual machine will emulate running a four node Swift +cluster. To begin: -* Get the *Ubuntu 10.04 LTS (Lucid Lynx)* server image: +* Get a Linux system server image, this guide will cover: - - Ubuntu Server ISO: http://releases.ubuntu.com/lucid/ubuntu-10.04.4-server-amd64.iso (717 MB) - - Ubuntu Live/Install: http://cdimage.ubuntu.com/releases/lucid/release/ubuntu-10.04.4-dvd-amd64.iso (4.2 GB) - - Ubuntu Mirrors: https://launchpad.net/ubuntu/+cdmirrors + * Ubuntu 24.04 LTS + * CentOS Stream 9 + * Fedora + * OpenSuse -* Create guest virtual machine from the Ubuntu image. +- Create guest virtual machine from the image. -Additional information about setting up a Swift development snapshot on other distributions is -available on the wiki at http://wiki.openstack.org/SAIOInstructions. +---------------------------- +What's in a +---------------------------- ------------------------------------------ -Installing dependencies and the core code ------------------------------------------ -* As root on guest (you'll have to log in as you, then `sudo su -`): +Much of the configuration described in this guide requires escalated +administrator (``root``) privileges; however, we assume that administrator logs +in as an unprivileged user and can use ``sudo`` to run privileged commands. + +Swift processes also run under a separate user and group, set by configuration +option, and referenced as ``:``. The default user +is ``swift``, which may not exist on your system. These instructions are +intended to allow a developer to use his/her username for +``:``. + +.. 
note:: + For OpenSuse users, a user's primary group is ``users``, so you have 2 options: + + * Change ``${USER}:${USER}`` to ``${USER}:users`` in all references of this guide; or + * Create a group for your username and add yourself to it:: + + sudo groupadd ${USER} && sudo gpasswd -a ${USER} ${USER} && newgrp ${USER} + +----------------------- +Installing dependencies +----------------------- + +* On ``apt`` based systems:: + + sudo apt-get update + sudo apt-get install curl gcc memcached rsync sqlite3 xfsprogs \ + git-core libffi-dev python3-setuptools \ + liberasurecode-dev libssl-dev + sudo apt-get install python3-coverage python3-dev python3-pytest \ + python3-xattr python3-eventlet \ + python3-greenlet python3-pastedeploy \ + python3-pip python3-dnspython + +* On ``CentOS`` (requires additional repositories):: + + sudo dnf update + sudo dnf install epel-release + sudo dnf config-manager --enable epel extras + sudo dnf install centos-release-openstack-epoxy + sudo dnf install curl gcc memcached rsync-daemon sqlite xfsprogs git-core \ + libffi-devel liberasurecode-devel \ + openssl-devel python3-setuptools \ + python3-coverage python3-devel python3-pytest \ + python3-pyxattr python3-eventlet \ + python3-greenlet python3-paste-deploy \ + python3-pip python3-dns + +* On ``Fedora``:: + + sudo dnf update + sudo dnf install curl gcc memcached rsync-daemon sqlite xfsprogs git-core \ + libffi-devel liberasurecode-devel python3-pyeclib \ + openssl-devel python3-setuptools \ + python3-coverage python3-devel python3-pytest \ + python3-pyxattr python3-eventlet \ + python3-greenlet python3-paste-deploy \ + python3-pip python3-dns - #. `apt-get install python-software-properties` - #. `add-apt-repository ppa:swift-core/release` - #. `apt-get update` - #. `apt-get install curl gcc git-core memcached python-coverage python-dev - python-nose python-setuptools python-simplejson python-xattr sqlite3 - xfsprogs python-eventlet python-greenlet python-pastedeploy - python-netifaces python-pip` - #. `pip install mock` - #. Install anything else you want, like screen, ssh, vim, etc. +* On ``OpenSuse``:: -* On Fedora, log in as root and do: + sudo zypper install curl gcc memcached rsync sqlite3 xfsprogs git-core \ + libffi-devel liberasurecode-devel python3-setuptools \ + libopenssl-devel + sudo zypper install python3-coverage python3-devel python3-nose \ + python3-xattr python3-eventlet python3-greenlet \ + python3-pip python3-dnspython - #. `yum install openstack-swift openstack-swift-proxy - openstack-swift-account openstack-swift-container openstack-swift-object` - #. `yum install xinetd rsync` - #. `yum install memcached` - #. `yum install python-netifaces python-nose python-mock` +.. note:: + This installs necessary system dependencies and *most* of the python + dependencies. Later in the process setuptools/distribute or pip will install + and/or upgrade packages. - This installs all necessary dependencies, and also creates user `swift` - and group `swift`. So, `swift:swift` ought to be used in every place where - this manual calls for `:`. +------------------- +Configuring storage +------------------- - Ensure that you are installing the version of Swift that corresponds to - this document. If not, enable the correct update repositories. +Swift requires some space on XFS filesystems to store data and run tests. -Next, choose either :ref:`partition-section` or :ref:`loopback-section`. +Choose either :ref:`partition-section` or :ref:`loopback-section`. .. 
_partition-section: @@ -58,731 +117,685 @@ Using a partition for storage ============================= If you are going to use a separate partition for Swift data, be sure to add -another device when creating the VM, and follow these instructions. - - #. `fdisk /dev/sdb` (set up a single partition) - #. `mkfs.xfs -i size=1024 /dev/sdb1` - #. Edit `/etc/fstab` and add - `/dev/sdb1 /mnt/sdb1 xfs noatime,nodiratime,nobarrier,logbufs=8 0 0` - #. `mkdir /mnt/sdb1` - #. `mount /mnt/sdb1` - #. `mkdir /mnt/sdb1/1 /mnt/sdb1/2 /mnt/sdb1/3 /mnt/sdb1/4` - #. `chown : /mnt/sdb1/*` - #. `mkdir /srv` - #. `for x in {1..4}; do ln -s /mnt/sdb1/$x /srv/$x; done` - #. `mkdir -p /etc/swift/object-server /etc/swift/container-server /etc/swift/account-server /srv/1/node/sdb1 /srv/2/node/sdb2 /srv/3/node/sdb3 /srv/4/node/sdb4 /var/run/swift` - #. `chown -R : /etc/swift /srv/[1-4]/ /var/run/swift` -- **Make sure to include the trailing slash after /srv/[1-4]/** - #. Add to `/etc/rc.local` (before the `exit 0`):: +another device when creating the VM, and follow these instructions: - mkdir -p /var/cache/swift /var/cache/swift2 /var/cache/swift3 /var/cache/swift4 - chown : /var/cache/swift* - mkdir -p /var/run/swift - chown : /var/run/swift - #. Next, skip to :ref:`rsync-section`. +.. note:: + The disk does not have to be ``/dev/sdb1`` (for example, it could be + ``/dev/vdb1``) however the mount point should still be ``/mnt/sdb1``. + +#. Set up a single partition on the device (this will wipe the drive):: + + sudo parted /dev/sdb mklabel msdos mkpart p xfs 0% 100% + +#. Create an XFS file system on the partition:: + + sudo mkfs.xfs /dev/sdb1 + +#. Find the UUID of the new partition:: + + sudo blkid + +#. Edit ``/etc/fstab`` and add:: + + UUID="" /mnt/sdb1 xfs noatime 0 0 + +#. Create the Swift data mount point and test that mounting works:: + + sudo mkdir /mnt/sdb1 + sudo mount -a +#. Next, skip to :ref:`common-dev-section`. .. _loopback-section: Using a loopback device for storage =================================== -If you want to use a loopback device instead of another partition, follow these instructions. - - #. `mkdir /srv` - #. `dd if=/dev/zero of=/srv/swift-disk bs=1024 count=0 seek=1000000` - (modify seek to make a larger or smaller partition) - #. `mkfs.xfs -i size=1024 /srv/swift-disk` - #. Edit `/etc/fstab` and add - `/srv/swift-disk /mnt/sdb1 xfs loop,noatime,nodiratime,nobarrier,logbufs=8 0 0` - #. `mkdir /mnt/sdb1` - #. `mount /mnt/sdb1` - #. `mkdir /mnt/sdb1/1 /mnt/sdb1/2 /mnt/sdb1/3 /mnt/sdb1/4` - #. `chown : /mnt/sdb1/*` - #. `for x in {1..4}; do ln -s /mnt/sdb1/$x /srv/$x; done` - #. `mkdir -p /etc/swift/object-server /etc/swift/container-server /etc/swift/account-server /srv/1/node/sdb1 /srv/2/node/sdb2 /srv/3/node/sdb3 /srv/4/node/sdb4 /var/run/swift` - #. `chown -R : /etc/swift /srv/[1-4]/ /var/run/swift` -- **Make sure to include the trailing slash after /srv/[1-4]/** - #. Add to `/etc/rc.local` (before the `exit 0`):: +If you want to use a loopback device instead of another partition, follow +these instructions: + +#. Create the file for the loopback device:: + + sudo mkdir -p /srv + sudo truncate -s 1GB /srv/swift-disk + sudo mkfs.xfs /srv/swift-disk + + Modify size specified in the ``truncate`` command to make a larger or + smaller partition as needed. + +#. Edit `/etc/fstab` and add:: + + /srv/swift-disk /mnt/sdb1 xfs loop,noatime 0 0 + +#. Create the Swift data mount point and test that mounting works:: + + sudo mkdir /mnt/sdb1 + sudo mount -a + +.. 
_common-dev-section: + +Common Post-Device Setup +======================== + +#. Create the individualized data links:: + + sudo mkdir /mnt/sdb1/1 /mnt/sdb1/2 /mnt/sdb1/3 /mnt/sdb1/4 + sudo chown ${USER}:${USER} /mnt/sdb1/* + for x in {1..4}; do sudo ln -s /mnt/sdb1/$x /srv/$x; done + sudo mkdir -p /srv/1/node/sdb1 /srv/1/node/sdb5 \ + /srv/2/node/sdb2 /srv/2/node/sdb6 \ + /srv/3/node/sdb3 /srv/3/node/sdb7 \ + /srv/4/node/sdb4 /srv/4/node/sdb8 + sudo mkdir -p /var/run/swift + sudo mkdir -p /var/cache/swift /var/cache/swift2 \ + /var/cache/swift3 /var/cache/swift4 + sudo chown -R ${USER}:${USER} /var/run/swift + sudo chown -R ${USER}:${USER} /var/cache/swift* + # **Make sure to include the trailing slash after /srv/$x/** + for x in {1..4}; do sudo chown -R ${USER}:${USER} /srv/$x/; done + + .. note:: + We create the mount points and mount the loopback file under + /mnt/sdb1. This file will contain one directory per simulated Swift node, + each owned by the current Swift user. + + We then create symlinks to these directories under /srv. + If the disk sdb or loopback file is unmounted, files will not be written under + /srv/\*, because the symbolic link destination /mnt/sdb1/* will not + exist. This prevents disk sync operations from writing to the root + partition in the event a drive is unmounted. + +#. Restore appropriate permissions on reboot. + + * On traditional Linux systems, add the following lines to ``/etc/rc.local`` (before the ``exit 0``):: mkdir -p /var/cache/swift /var/cache/swift2 /var/cache/swift3 /var/cache/swift4 chown : /var/cache/swift* mkdir -p /var/run/swift chown : /var/run/swift -.. _rsync-section: + * On CentOS and Fedora we can use systemd (rc.local is deprecated):: ----------------- -Setting up rsync ----------------- + cat << EOF |sudo tee /etc/tmpfiles.d/swift.conf + d /var/cache/swift 0755 ${USER} ${USER} - - + d /var/cache/swift2 0755 ${USER} ${USER} - - + d /var/cache/swift3 0755 ${USER} ${USER} - - + d /var/cache/swift4 0755 ${USER} ${USER} - - + d /var/run/swift 0755 ${USER} ${USER} - - + EOF - #. 
Create /etc/rsyncd.conf:: - - uid = - gid = - log file = /var/log/rsyncd.log - pid file = /var/run/rsyncd.pid - address = 127.0.0.1 - - [account6012] - max connections = 25 - path = /srv/1/node/ - read only = false - lock file = /var/lock/account6012.lock - - [account6022] - max connections = 25 - path = /srv/2/node/ - read only = false - lock file = /var/lock/account6022.lock - - [account6032] - max connections = 25 - path = /srv/3/node/ - read only = false - lock file = /var/lock/account6032.lock - - [account6042] - max connections = 25 - path = /srv/4/node/ - read only = false - lock file = /var/lock/account6042.lock - - - [container6011] - max connections = 25 - path = /srv/1/node/ - read only = false - lock file = /var/lock/container6011.lock - - [container6021] - max connections = 25 - path = /srv/2/node/ - read only = false - lock file = /var/lock/container6021.lock - - [container6031] - max connections = 25 - path = /srv/3/node/ - read only = false - lock file = /var/lock/container6031.lock - - [container6041] - max connections = 25 - path = /srv/4/node/ - read only = false - lock file = /var/lock/container6041.lock - - - [object6010] - max connections = 25 - path = /srv/1/node/ - read only = false - lock file = /var/lock/object6010.lock - - [object6020] - max connections = 25 - path = /srv/2/node/ - read only = false - lock file = /var/lock/object6020.lock - - [object6030] - max connections = 25 - path = /srv/3/node/ - read only = false - lock file = /var/lock/object6030.lock - - [object6040] - max connections = 25 - path = /srv/4/node/ - read only = false - lock file = /var/lock/object6040.lock - - #. On Ubuntu, edit the following line in /etc/default/rsync:: - - RSYNC_ENABLE=true - - On Fedora, edit the following line in /etc/xinetd.d/rsync:: - - disable = no - - #. On Ubuntu `service rsync restart` + * On OpenSuse place the lines in ``/etc/init.d/boot.local``. ------------------- -Starting memcached ------------------- + .. note:: + On some systems the rc file might need to be an executable shell script. -On Fedora, make sure that memcached runs, running this if necessary: +Creating an XFS tmp dir +----------------------- - * `systemctl enable memcached.service` - * `systemctl start memcached.service` +Tests require having a directory available on an XFS filesystem. By default the +tests use ``/tmp``, however this can be pointed elsewhere with the ``TMPDIR`` +environment variable. -If this is not done, tokens of tempauth expire immediately and accessing -Swift with curl becomes impossible. +.. note:: + If your root filesystem is XFS, you can skip this section if ``/tmp`` is + just a directory and not a mounted tmpfs. Or you could simply point to any + existing directory owned by your user by specifying it with the ``TMPDIR`` + environment variable. ---------------------------------------------------- -Optional: Setting up rsyslog for individual logging ---------------------------------------------------- + If your root filesystem is not XFS, you should create a loopback device, + format it with XFS and mount it. You can mount it over ``/tmp`` or to + another location and specify it with the ``TMPDIR`` environment variable. - #. 
Create /etc/rsyslog.d/10-swift.conf:: +* Create the file for the tmp loopback device:: - # Uncomment the following to have a log containing all logs together - #local1,local2,local3,local4,local5.* /var/log/swift/all.log + sudo mkdir -p /srv + sudo truncate -s 1GB /srv/swift-tmp # create 1GB file for XFS in /srv + sudo mkfs.xfs /srv/swift-tmp - # Uncomment the following to have hourly proxy logs for stats processing - #$template HourlyProxyLog,"/var/log/swift/hourly/%$YEAR%%$MONTH%%$DAY%%$HOUR%" - #local1.*;local1.!notice ?HourlyProxyLog +* To mount the tmp loopback device at ``/tmp``, do the following:: - local1.*;local1.!notice /var/log/swift/proxy.log - local1.notice /var/log/swift/proxy.error - local1.* ~ + sudo mount -o loop,noatime /srv/swift-tmp /tmp + sudo chmod -R 1777 /tmp - local2.*;local2.!notice /var/log/swift/storage1.log - local2.notice /var/log/swift/storage1.error - local2.* ~ + * To persist this, edit and add the following to ``/etc/fstab``:: - local3.*;local3.!notice /var/log/swift/storage2.log - local3.notice /var/log/swift/storage2.error - local3.* ~ + /srv/swift-tmp /tmp xfs rw,noatime,attr2,inode64,noquota 0 0 - local4.*;local4.!notice /var/log/swift/storage3.log - local4.notice /var/log/swift/storage3.error - local4.* ~ +* To mount the tmp loopback at an alternate location (for example, ``/mnt/tmp``), + do the following:: - local5.*;local5.!notice /var/log/swift/storage4.log - local5.notice /var/log/swift/storage4.error - local5.* ~ + sudo mkdir -p /mnt/tmp + sudo mount -o loop,noatime /srv/swift-tmp /mnt/tmp + sudo chown ${USER}:${USER} /mnt/tmp - #. Edit /etc/rsyslog.conf and make the following change:: + * To persist this, edit and add the following to ``/etc/fstab``:: - $PrivDropToGroup adm + /srv/swift-tmp /mnt/tmp xfs rw,noatime,attr2,inode64,noquota 0 0 - #. `mkdir -p /var/log/swift/hourly` - #. `chown -R syslog.adm /var/log/swift` - #. `chmod -R g+w /var/log/swift` - #. `service rsyslog restart` + * Set your ``TMPDIR`` environment dir so that Swift looks in the right location:: ------------------------------------------------- -Getting the code and setting up test environment ------------------------------------------------- + export TMPDIR=/mnt/tmp + echo "export TMPDIR=/mnt/tmp" >> $HOME/.bashrc -Sample configuration files are provided with all defaults in line-by-line comments. +---------------- +Getting the code +---------------- -Do these commands as you on guest. +#. Check out the python-swiftclient repo:: - #. `mkdir ~/bin` - #. Check out the swift repo with `git clone https://github.com/openstack/swift.git` - #. Build a development installation of swift, for example: - `cd ~/swift; sudo python setup.py develop` - #. Check out the python-swiftclient repo with `git clone https://github.com/openstack/python-swiftclient.git` - #. Build a development installation of python-swiftclient, for example: - `cd ~/python-swiftclient; sudo python setup.py develop` - #. Edit `~/.bashrc` and add to the end:: + cd $HOME; git clone https://opendev.org/openstack/python-swiftclient.git - export SWIFT_TEST_CONFIG_FILE=/etc/swift/test.conf - export PATH=${PATH}:~/bin +#. Build a development installation of python-swiftclient:: - #. `. ~/.bashrc` + cd $HOME/python-swiftclient; sudo python3 setup.py develop; cd - ---------------------- -Configuring each node ---------------------- +#. Check out the Swift repo:: -Sample configuration files are provided with all defaults in line-by-line comments. + git clone https://github.com/openstack/swift.git - #. 
Create `/etc/swift/proxy-server.conf`:: +#. Build a development installation of Swift:: - [DEFAULT] - bind_port = 8080 - user = - log_facility = LOG_LOCAL1 - eventlet_debug = true + cd $HOME/swift; sudo pip install --no-binary cryptography -r requirements.txt; sudo python setup.py develop; cd - - [pipeline:main] - pipeline = healthcheck cache tempauth proxy-logging proxy-server + .. note:: + Due to a difference in how ``libssl.so`` is named in OpenSuse vs. other Linux distros the + wheel/binary won't work; thus we use ``--no-binary cryptography`` to build ``cryptography`` + locally. - [app:proxy-server] - use = egg:swift#proxy - allow_account_management = true - account_autocreate = true + Fedora users might have to perform the following if development + installation of Swift fails:: - [filter:tempauth] - use = egg:swift#tempauth - user_admin_admin = admin .admin .reseller_admin - user_test_tester = testing .admin - user_test2_tester2 = testing2 .admin - user_test_tester3 = testing3 + sudo pip install -U xattr - [filter:healthcheck] - use = egg:swift#healthcheck +#. Install Swift's test dependencies:: - [filter:cache] - use = egg:swift#memcache + cd $HOME/swift; sudo pip install -r test-requirements.txt - [filter:proxy-logging] - use = egg:swift#proxy_logging +---------------- +Setting up rsync +---------------- - #. Create `/etc/swift/swift.conf`: +#. Create ``/etc/rsyncd.conf``:: - .. code-block:: none + sudo cp $HOME/swift/doc/saio/rsyncd.conf /etc/ + sudo sed -i "s//${USER}/" /etc/rsyncd.conf - [swift-hash] - # random unique string that can never change (DO NOT LOSE) - swift_hash_path_suffix = changeme + Here is the default ``rsyncd.conf`` file contents maintained in the repo + that is copied and fixed up above: - #. Create `/etc/swift/account-server/1.conf`:: + .. literalinclude:: /../saio/rsyncd.conf + :language: ini - [DEFAULT] - devices = /srv/1/node - mount_check = false - disable_fallocate = true - bind_port = 6012 - user = - log_facility = LOG_LOCAL2 - recon_cache_path = /var/cache/swift - eventlet_debug = true +#. Enable rsync daemon - [pipeline:main] - pipeline = recon account-server + * On Ubuntu, edit the following line in ``/etc/default/rsync``:: - [app:account-server] - use = egg:swift#account + RSYNC_ENABLE=true - [filter:recon] - use = egg:swift#recon + .. note:: + You might have to create the file to perform the edits. - [account-replicator] - vm_test_mode = yes + * On CentOS and Fedora, enable the systemd service:: - [account-auditor] + sudo systemctl enable rsyncd - [account-reaper] + * On OpenSuse, nothing needs to happen here. - #. Create `/etc/swift/account-server/2.conf`:: - [DEFAULT] - devices = /srv/2/node - mount_check = false - disable_fallocate = true - bind_port = 6022 - user = - log_facility = LOG_LOCAL3 - recon_cache_path = /var/cache/swift2 - eventlet_debug = true +#. On platforms with SELinux in ``Enforcing`` mode, either set to ``Permissive``:: - [pipeline:main] - pipeline = recon account-server + sudo setenforce Permissive + sudo sed -i 's/^SELINUX=.*/SELINUX=permissive/g' /etc/selinux/config - [app:account-server] - use = egg:swift#account + Or just allow rsync full access:: - [filter:recon] - use = egg:swift#recon + sudo setsebool -P rsync_full_access 1 - [account-replicator] - vm_test_mode = yes +#. Start the rsync daemon - [account-auditor] + * On Ubuntu 14.04, run:: - [account-reaper] + sudo service rsync restart - #. 
Create `/etc/swift/account-server/3.conf`:: + * On Ubuntu 16.04, run:: - [DEFAULT] - devices = /srv/3/node - mount_check = false - disable_fallocate = true - bind_port = 6032 - user = - log_facility = LOG_LOCAL4 - recon_cache_path = /var/cache/swift3 - eventlet_debug = true + sudo systemctl enable rsync + sudo systemctl start rsync - [pipeline:main] - pipeline = recon account-server + * On CentOS, Fedora and OpenSuse, run:: - [app:account-server] - use = egg:swift#account + sudo systemctl start rsyncd - [filter:recon] - use = egg:swift#recon + * On other xinetd based systems simply run:: - [account-replicator] - vm_test_mode = yes + sudo service xinetd restart - [account-auditor] +#. Verify rsync is accepting connections for all servers:: - [account-reaper] + rsync rsync://pub@localhost/ - #. Create `/etc/swift/account-server/4.conf`:: + You should see the following output from the above command:: - [DEFAULT] - devices = /srv/4/node - mount_check = false - disable_fallocate = true - bind_port = 6042 - user = - log_facility = LOG_LOCAL5 - recon_cache_path = /var/cache/swift4 - eventlet_debug = true + account6212 + account6222 + account6232 + account6242 + container6211 + container6221 + container6231 + container6241 + object6210 + object6220 + object6230 + object6240 - [pipeline:main] - pipeline = recon account-server +------------------ +Starting memcached +------------------ - [app:account-server] - use = egg:swift#account +On non-Ubuntu distros you need to ensure memcached is running:: - [filter:recon] - use = egg:swift#recon + sudo service memcached start + sudo chkconfig memcached on - [account-replicator] - vm_test_mode = yes +or:: - [account-auditor] + sudo systemctl enable memcached + sudo systemctl start memcached - [account-reaper] +The tempauth middleware stores tokens in memcached. If memcached is not +running, tokens cannot be validated, and accessing Swift becomes impossible. - #. Create `/etc/swift/container-server/1.conf`:: +--------------------------------------------------- +Optional: Setting up rsyslog for individual logging +--------------------------------------------------- - [DEFAULT] - devices = /srv/1/node - mount_check = false - disable_fallocate = true - bind_port = 6011 - user = - log_facility = LOG_LOCAL2 - recon_cache_path = /var/cache/swift - eventlet_debug = true +Fedora and OpenSuse may not have rsyslog installed, in which case you will need +to install it if you want to use individual logging. - [pipeline:main] - pipeline = recon container-server +#. Install rsyslogd - [app:container-server] - use = egg:swift#container - [filter:recon] - use = egg:swift#recon + * On Fedora:: - [container-replicator] - vm_test_mode = yes + sudo dnf install rsyslog - [container-updater] + * On OpenSuse:: - [container-auditor] + sudo zypper install rsyslog - [container-sync] +#. Install the Swift rsyslogd configuration:: - #. Create `/etc/swift/container-server/2.conf`:: + sudo cp $HOME/swift/doc/saio/rsyslog.d/10-swift.conf /etc/rsyslog.d/ - [DEFAULT] - devices = /srv/2/node - mount_check = false - disable_fallocate = true - bind_port = 6021 - user = - log_facility = LOG_LOCAL3 - recon_cache_path = /var/cache/swift2 - eventlet_debug = true + Be sure to review that conf file to determine if you want all the logs + in one file vs. all the logs separated out, and if you want hourly logs + for stats processing. For convenience, we provide its default contents + below: - [pipeline:main] - pipeline = recon container-server + .. 
literalinclude:: /../saio/rsyslog.d/10-swift.conf + :language: ini - [app:container-server] - use = egg:swift#container +#. Edit ``/etc/rsyslog.conf`` and make the following change (usually in the + "GLOBAL DIRECTIVES" section):: - [filter:recon] - use = egg:swift#recon + $PrivDropToGroup adm - [container-replicator] - vm_test_mode = yes +#. If using hourly logs (see above) perform:: - [container-updater] + sudo mkdir -p /var/log/swift/hourly - [container-auditor] + Otherwise perform:: - [container-sync] + sudo mkdir -p /var/log/swift - #. Create `/etc/swift/container-server/3.conf`:: +#. Setup the logging directory and start syslog: - [DEFAULT] - devices = /srv/3/node - mount_check = false - disable_fallocate = true - bind_port = 6031 - user = - log_facility = LOG_LOCAL4 - recon_cache_path = /var/cache/swift3 - eventlet_debug = true + * On Ubuntu:: - [pipeline:main] - pipeline = recon container-server + sudo chown -R syslog.adm /var/log/swift + sudo chmod -R g+w /var/log/swift + sudo service rsyslog restart - [app:container-server] - use = egg:swift#container + * On CentOS, Fedora and OpenSuse:: - [filter:recon] - use = egg:swift#recon + sudo chown -R root:adm /var/log/swift + sudo chmod -R g+w /var/log/swift + sudo systemctl restart rsyslog + sudo systemctl enable rsyslog - [container-replicator] - vm_test_mode = yes +--------------------- +Configuring each node +--------------------- - [container-updater] +After performing the following steps, be sure to verify that Swift has access +to resulting configuration files (sample configuration files are provided with +all defaults in line-by-line comments). - [container-auditor] +#. Optionally remove an existing swift directory:: - [container-sync] + sudo rm -rf /etc/swift - #. Create `/etc/swift/container-server/4.conf`:: +#. Populate the ``/etc/swift`` directory itself:: - [DEFAULT] - devices = /srv/4/node - mount_check = false - disable_fallocate = true - bind_port = 6041 - user = - log_facility = LOG_LOCAL5 - recon_cache_path = /var/cache/swift4 - eventlet_debug = true + cd $HOME/swift/doc; sudo cp -r saio/swift /etc/swift; cd - + sudo chown -R ${USER}:${USER} /etc/swift - [pipeline:main] - pipeline = recon container-server +#. Update ```` references in the Swift config files:: - [app:container-server] - use = egg:swift#container + find /etc/swift/ -name \*.conf | xargs sudo sed -i "s//${USER}/" - [filter:recon] - use = egg:swift#recon +The contents of the configuration files provided by executing the above +commands are as follows: - [container-replicator] - vm_test_mode = yes +#. ``/etc/swift/swift.conf`` - [container-updater] + .. literalinclude:: /../saio/swift/swift.conf + :language: ini - [container-auditor] +#. ``/etc/swift/proxy-server.conf`` - [container-sync] + .. literalinclude:: /../saio/swift/proxy-server.conf + :language: ini +#. ``/etc/swift/object-expirer.conf`` - #. Create `/etc/swift/object-server/1.conf`:: + .. literalinclude:: /../saio/swift/object-expirer.conf + :language: ini - [DEFAULT] - devices = /srv/1/node - mount_check = false - disable_fallocate = true - bind_port = 6010 - user = - log_facility = LOG_LOCAL2 - recon_cache_path = /var/cache/swift - eventlet_debug = true +#. ``/etc/swift/container-sync-realms.conf`` - [pipeline:main] - pipeline = recon object-server + .. literalinclude:: /../saio/swift/container-sync-realms.conf + :language: ini - [app:object-server] - use = egg:swift#object +#. ``/etc/swift/account-server/1.conf`` - [filter:recon] - use = egg:swift#recon + .. 
literalinclude:: /../saio/swift/account-server/1.conf + :language: ini - [object-replicator] - vm_test_mode = yes +#. ``/etc/swift/container-server/1.conf`` - [object-updater] + .. literalinclude:: /../saio/swift/container-server/1.conf + :language: ini - [object-auditor] +#. ``/etc/swift/container-reconciler/1.conf`` - #. Create `/etc/swift/object-server/2.conf`:: + .. literalinclude:: /../saio/swift/container-reconciler/1.conf + :language: ini - [DEFAULT] - devices = /srv/2/node - mount_check = false - disable_fallocate = true - bind_port = 6020 - user = - log_facility = LOG_LOCAL3 - recon_cache_path = /var/cache/swift2 - eventlet_debug = true +#. ``/etc/swift/object-server/1.conf`` - [pipeline:main] - pipeline = recon object-server + .. literalinclude:: /../saio/swift/object-server/1.conf + :language: ini - [app:object-server] - use = egg:swift#object +#. ``/etc/swift/account-server/2.conf`` - [filter:recon] - use = egg:swift#recon + .. literalinclude:: /../saio/swift/account-server/2.conf + :language: ini - [object-replicator] - vm_test_mode = yes +#. ``/etc/swift/container-server/2.conf`` - [object-updater] + .. literalinclude:: /../saio/swift/container-server/2.conf + :language: ini - [object-auditor] +#. ``/etc/swift/container-reconciler/2.conf`` - #. Create `/etc/swift/object-server/3.conf`:: + .. literalinclude:: /../saio/swift/container-reconciler/2.conf + :language: ini - [DEFAULT] - devices = /srv/3/node - mount_check = false - disable_fallocate = true - bind_port = 6030 - user = - log_facility = LOG_LOCAL4 - recon_cache_path = /var/cache/swift3 - eventlet_debug = true +#. ``/etc/swift/object-server/2.conf`` - [pipeline:main] - pipeline = recon object-server + .. literalinclude:: /../saio/swift/object-server/2.conf + :language: ini - [app:object-server] - use = egg:swift#object +#. ``/etc/swift/account-server/3.conf`` - [filter:recon] - use = egg:swift#recon + .. literalinclude:: /../saio/swift/account-server/3.conf + :language: ini - [object-replicator] - vm_test_mode = yes +#. ``/etc/swift/container-server/3.conf`` - [object-updater] + .. literalinclude:: /../saio/swift/container-server/3.conf + :language: ini - [object-auditor] +#. ``/etc/swift/container-reconciler/3.conf`` - #. Create `/etc/swift/object-server/4.conf`:: + .. literalinclude:: /../saio/swift/container-reconciler/3.conf + :language: ini - [DEFAULT] - devices = /srv/4/node - mount_check = false - disable_fallocate = true - bind_port = 6040 - user = - log_facility = LOG_LOCAL5 - recon_cache_path = /var/cache/swift4 - eventlet_debug = true +#. ``/etc/swift/object-server/3.conf`` - [pipeline:main] - pipeline = recon object-server + .. literalinclude:: /../saio/swift/object-server/3.conf + :language: ini - [app:object-server] - use = egg:swift#object +#. ``/etc/swift/account-server/4.conf`` - [filter:recon] - use = egg:swift#recon + .. literalinclude:: /../saio/swift/account-server/4.conf + :language: ini - [object-replicator] - vm_test_mode = yes +#. ``/etc/swift/container-server/4.conf`` - [object-updater] + .. literalinclude:: /../saio/swift/container-server/4.conf + :language: ini - [object-auditor] +#. ``/etc/swift/container-reconciler/4.conf`` + + .. literalinclude:: /../saio/swift/container-reconciler/4.conf + :language: ini + +#. ``/etc/swift/object-server/4.conf`` + + .. literalinclude:: /../saio/swift/object-server/4.conf + :language: ini + +.. _setup_scripts: ------------------------------------ Setting up scripts for running Swift ------------------------------------ - #. Create `~/bin/resetswift.` +#. 
Copy the SAIO scripts for resetting the environment:: + + mkdir -p $HOME/bin + cd $HOME/swift/doc; cp saio/bin/* $HOME/bin; cd - + chmod +x $HOME/bin/* + +#. Edit the ``$HOME/bin/resetswift`` script + + The template ``resetswift`` script looks like the following: + + .. literalinclude:: /../saio/bin/resetswift + :language: bash + + If you did not set up rsyslog for individual logging, remove the ``find + /var/log/swift...`` line:: + + sed -i "/find \/var\/log\/swift/d" $HOME/bin/resetswift + + +#. Install the sample configuration file for running tests:: + + cp $HOME/swift/test/sample.conf /etc/swift/test.conf + + The template ``test.conf`` looks like the following: + + .. literalinclude:: /../../test/sample.conf + :language: ini + +----------------------------------------- +Configure environment variables for Swift +----------------------------------------- + +#. Add an environment variable for running tests below:: + + echo "export SWIFT_TEST_CONFIG_FILE=/etc/swift/test.conf" >> $HOME/.bashrc + +#. Be sure that your ``PATH`` includes the ``bin`` directory:: + + echo "export PATH=${PATH}:$HOME/bin" >> $HOME/.bashrc + +#. If you are using a loopback device for Swift Storage, add an environment var + to substitute ``/dev/sdb1`` with ``/srv/swift-disk``:: + + echo "export SAIO_BLOCK_DEVICE=/srv/swift-disk" >> $HOME/.bashrc + +#. If you are using a device other than ``/dev/sdb1`` for Swift storage (for + example, ``/dev/vdb1``), add an environment var to substitute it:: + + echo "export SAIO_BLOCK_DEVICE=/dev/vdb1" >> $HOME/.bashrc + +#. If you are using a location other than ``/tmp`` for Swift tmp data (for + example, ``/mnt/tmp``), add ``TMPDIR`` environment var to set it:: + + export TMPDIR=/mnt/tmp + echo "export TMPDIR=/mnt/tmp" >> $HOME/.bashrc + +#. Source the above environment variables into your current environment:: + + . $HOME/.bashrc + +-------------------------- +Constructing initial rings +-------------------------- + +#. Construct the initial rings using the provided script:: + + remakerings + + The ``remakerings`` script looks like the following: + + .. literalinclude:: /../saio/bin/remakerings + :language: bash + + You can expect the output from this command to produce the following. Note + that 3 object rings are created in order to test storage policies and EC in + the SAIO environment. The EC ring is the only one with all 8 devices. + There are also two replication rings, one for 3x replication and another + for 2x replication, but those rings only use 4 devices: + + + .. code-block:: console + + Device d0r1z1-127.0.0.1:6210R127.0.0.1:6210/sdb1_"" with 1.0 weight got id 0 + Device d1r1z2-127.0.0.2:6220R127.0.0.2:6220/sdb2_"" with 1.0 weight got id 1 + Device d2r1z3-127.0.0.3:6230R127.0.0.3:6230/sdb3_"" with 1.0 weight got id 2 + Device d3r1z4-127.0.0.4:6240R127.0.0.4:6240/sdb4_"" with 1.0 weight got id 3 + Reassigned 3072 (300.00%) partitions. Balance is now 0.00. Dispersion is now 0.00 + Device d0r1z1-127.0.0.1:6210R127.0.0.1:6210/sdb1_"" with 1.0 weight got id 0 + Device d1r1z2-127.0.0.2:6220R127.0.0.2:6220/sdb2_"" with 1.0 weight got id 1 + Device d2r1z3-127.0.0.3:6230R127.0.0.3:6230/sdb3_"" with 1.0 weight got id 2 + Device d3r1z4-127.0.0.4:6240R127.0.0.4:6240/sdb4_"" with 1.0 weight got id 3 + Reassigned 2048 (200.00%) partitions. Balance is now 0.00. 
Dispersion is now 0.00 + Device d0r1z1-127.0.0.1:6210R127.0.0.1:6210/sdb1_"" with 1.0 weight got id 0 + Device d1r1z1-127.0.0.1:6210R127.0.0.1:6210/sdb5_"" with 1.0 weight got id 1 + Device d2r1z2-127.0.0.2:6220R127.0.0.2:6220/sdb2_"" with 1.0 weight got id 2 + Device d3r1z2-127.0.0.2:6220R127.0.0.2:6220/sdb6_"" with 1.0 weight got id 3 + Device d4r1z3-127.0.0.3:6230R127.0.0.3:6230/sdb3_"" with 1.0 weight got id 4 + Device d5r1z3-127.0.0.3:6230R127.0.0.3:6230/sdb7_"" with 1.0 weight got id 5 + Device d6r1z4-127.0.0.4:6240R127.0.0.4:6240/sdb4_"" with 1.0 weight got id 6 + Device d7r1z4-127.0.0.4:6240R127.0.0.4:6240/sdb8_"" with 1.0 weight got id 7 + Reassigned 6144 (600.00%) partitions. Balance is now 0.00. Dispersion is now 0.00 + Device d0r1z1-127.0.0.1:6211R127.0.0.1:6211/sdb1_"" with 1.0 weight got id 0 + Device d1r1z2-127.0.0.2:6221R127.0.0.2:6221/sdb2_"" with 1.0 weight got id 1 + Device d2r1z3-127.0.0.3:6231R127.0.0.3:6231/sdb3_"" with 1.0 weight got id 2 + Device d3r1z4-127.0.0.4:6241R127.0.0.4:6241/sdb4_"" with 1.0 weight got id 3 + Reassigned 3072 (300.00%) partitions. Balance is now 0.00. Dispersion is now 0.00 + Device d0r1z1-127.0.0.1:6212R127.0.0.1:6212/sdb1_"" with 1.0 weight got id 0 + Device d1r1z2-127.0.0.2:6222R127.0.0.2:6222/sdb2_"" with 1.0 weight got id 1 + Device d2r1z3-127.0.0.3:6232R127.0.0.3:6232/sdb3_"" with 1.0 weight got id 2 + Device d3r1z4-127.0.0.4:6242R127.0.0.4:6242/sdb4_"" with 1.0 weight got id 3 + Reassigned 3072 (300.00%) partitions. Balance is now 0.00. Dispersion is now 0.00 + + +#. Read more about Storage Policies and your SAIO :doc:`policies_saio` + +------------- +Testing Swift +------------- - If you are using a loopback device substitute `/dev/sdb1` with `/srv/swift-disk`. +#. Verify the unit tests run:: - If you did not set up rsyslog for individual logging, remove the `find /var/log/swift...` line:: + $HOME/swift/.unittests - #!/bin/bash + Note that the unit tests do not require any Swift daemons running. - swift-init all stop - find /var/log/swift -type f -exec rm -f {} \; - sudo umount /mnt/sdb1 - sudo mkfs.xfs -f -i size=1024 /dev/sdb1 - sudo mount /mnt/sdb1 - sudo mkdir /mnt/sdb1/1 /mnt/sdb1/2 /mnt/sdb1/3 /mnt/sdb1/4 - sudo chown : /mnt/sdb1/* - mkdir -p /srv/1/node/sdb1 /srv/2/node/sdb2 /srv/3/node/sdb3 /srv/4/node/sdb4 - sudo rm -f /var/log/debug /var/log/messages /var/log/rsyncd.log /var/log/syslog - find /var/cache/swift* -type f -name *.recon -exec rm -f {} \; - sudo service rsyslog restart - sudo service memcached restart +#. Start the "main" Swift daemon processes (proxy, account, container, and + object):: - #. Create `~/bin/remakerings`:: + startmain - #!/bin/bash + (The "``Unable to increase file descriptor limit. Running as non-root?``" + warnings are expected and ok.) - cd /etc/swift + The ``startmain`` script looks like the following: - rm -f *.builder *.ring.gz backups/*.builder backups/*.ring.gz + .. 
literalinclude:: /../saio/bin/startmain + :language: bash - swift-ring-builder object.builder create 18 3 1 - swift-ring-builder object.builder add z1-127.0.0.1:6010/sdb1 1 - swift-ring-builder object.builder add z2-127.0.0.1:6020/sdb2 1 - swift-ring-builder object.builder add z3-127.0.0.1:6030/sdb3 1 - swift-ring-builder object.builder add z4-127.0.0.1:6040/sdb4 1 - swift-ring-builder object.builder rebalance - swift-ring-builder container.builder create 18 3 1 - swift-ring-builder container.builder add z1-127.0.0.1:6011/sdb1 1 - swift-ring-builder container.builder add z2-127.0.0.1:6021/sdb2 1 - swift-ring-builder container.builder add z3-127.0.0.1:6031/sdb3 1 - swift-ring-builder container.builder add z4-127.0.0.1:6041/sdb4 1 - swift-ring-builder container.builder rebalance - swift-ring-builder account.builder create 18 3 1 - swift-ring-builder account.builder add z1-127.0.0.1:6012/sdb1 1 - swift-ring-builder account.builder add z2-127.0.0.1:6022/sdb2 1 - swift-ring-builder account.builder add z3-127.0.0.1:6032/sdb3 1 - swift-ring-builder account.builder add z4-127.0.0.1:6042/sdb4 1 - swift-ring-builder account.builder rebalance +#. Get an ``X-Storage-Url`` and ``X-Auth-Token``:: - #. Create `~/bin/startmain`:: + curl -v -H 'X-Storage-User: test:tester' -H 'X-Storage-Pass: testing' http://127.0.0.1:8080/auth/v1.0 - #!/bin/bash +#. Check that you can ``GET`` account:: - swift-init main start + curl -v -H 'X-Auth-Token: ' - #. Create `~/bin/startrest`:: +#. Check that the ``swift`` command provided by python-swiftclient works:: - #!/bin/bash + swift -A http://127.0.0.1:8080/auth/v1.0 -U test:tester -K testing stat - swift-init rest start +#. Verify the functional tests run:: - #. `chmod +x ~/bin/*` - #. `remakerings` - #. `cd ~/swift; ./.unittests` - #. `startmain` (The ``Unable to increase file descriptor limit. Running as non-root?`` warnings are expected and ok.) - #. Get an `X-Storage-Url` and `X-Auth-Token`: ``curl -v -H 'X-Storage-User: test:tester' -H 'X-Storage-Pass: testing' http://127.0.0.1:8080/auth/v1.0`` - #. Check that you can GET account: ``curl -v -H 'X-Auth-Token: ' `` - #. Check that `swift` works: `swift -A http://127.0.0.1:8080/auth/v1.0 -U test:tester -K testing stat` - #. `cp ~/swift/test/sample.conf /etc/swift/test.conf` - #. `cd ~/swift; ./.functests` (Note: functional tests will first delete - everything in the configured accounts.) - #. `cd ~/swift; ./.probetests` (Note: probe tests will reset your - environment as they call `resetswift` for each test.) + $HOME/swift/.functests -If you plan to work on documentation (and who doesn't?!) you must -install Sphinx and then you can build the documentation: + (Note: functional tests will first delete everything in the configured + accounts.) -On Ubuntu: - #. `sudo apt-get install python-sphinx` - #. `python setup.py build_sphinx` +#. Verify the probe tests run:: -On MacOS: - #. `sudo easy_install -U sphinx` - #. `python setup.py build_sphinx` + $HOME/swift/.probetests -Install tox so you find Py26 and PEP8 problems before Jenkins does: - #. `sudo apt-get install python2.6-dev python-pip` - #. `sudo pip install tox` + (Note: probe tests will reset your environment as they call ``resetswift`` + for each test.) 
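If you would rather not copy the token and storage URL by hand while experimenting, the two ``curl`` steps above can be combined in a small shell snippet. This is only a convenience sketch: it assumes the default ``test:tester`` / ``testing`` tempauth user configured earlier in this guide and a proxy listening on ``http://127.0.0.1:8080``::

    # Authenticate once and keep the headers tempauth returns
    auth=$(curl -si -H 'X-Storage-User: test:tester' \
                    -H 'X-Storage-Pass: testing' \
                    http://127.0.0.1:8080/auth/v1.0)

    # Pull X-Storage-Url and X-Auth-Token out of the response headers
    url=$(echo "$auth" | tr -d '\r' | awk 'tolower($1) == "x-storage-url:" {print $2}')
    token=$(echo "$auth" | tr -d '\r' | awk 'tolower($1) == "x-auth-token:" {print $2}')

    # GET the account using the captured values
    curl -v -H "X-Auth-Token: $token" "$url"

The account ``GET`` should return the same container listing that the ``swift`` CLI reports, which is a quick way to confirm that the raw API and the client are talking to the same cluster.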
---------------- Debugging Issues ---------------- -If all doesn't go as planned, and tests fail, or you can't auth, or something doesn't work, here are some good starting places to look for issues: +If all doesn't go as planned, and tests fail, or you can't auth, or something +doesn't work, here are some good starting places to look for issues: -#. Everything is logged in /var/log/syslog, so that is a good first place to - look for errors (most likely python tracebacks). +#. Everything is logged using system facilities -- usually in ``/var/log/syslog``, + but possibly in ``/var/log/messages`` on e.g. Fedora -- so that is a good first + place to look for errors (most likely python tracebacks). #. Make sure all of the server processes are running. For the base functionality, the Proxy, Account, Container, and Object servers should be running. #. If one of the servers are not running, and no errors are logged to syslog, it may be useful to try to start the server manually, for example: - `swift-object-server /etc/swift/object-server/1.conf` will start the + ``swift-object-server /etc/swift/object-server/1.conf`` will start the object server. If there are problems not showing up in syslog, then you will likely see the traceback on startup. #. If you need to, you can turn off syslog for unit tests. This can be - useful for environments where /dev/log is unavailable, or which + useful for environments where ``/dev/log`` is unavailable, or which cannot rate limit (unit tests generate a lot of logs very quickly). - Open the file SWIFT_TEST_CONFIG_FILE points to, and change the - value of fake_syslog to True. + Open the file ``SWIFT_TEST_CONFIG_FILE`` points to, and change the + value of ``fake_syslog`` to ``True``. +#. If you encounter a ``401 Unauthorized`` when following Step 12 where + you check that you can ``GET`` account, use ``sudo service memcached status`` + and check if memcache is running. If memcache is not running, start it using + ``sudo service memcached start``. Once memcache is running, rerun ``GET`` account. + +------------ +Known Issues +------------ + +Listed here are some "gotcha's" that you may run into when using or testing your SAIO: + +#. fallocate_reserve - in most cases a SAIO doesn't have a very large XFS partition + so having fallocate enabled and fallocate_reserve set can cause issues, specifically + when trying to run the functional tests. For this reason fallocate has been turned + off on the object-servers in the SAIO. If you want to play with the fallocate_reserve + settings then know that functional tests will fail unless you change the max_file_size + constraint to something more reasonable then the default (5G). Ideally you'd make + it 1/4 of your XFS file system size so the tests can pass. diff --git a/doc/source/development_watchers.rst b/doc/source/development_watchers.rst new file mode 100644 index 0000000000..6aee254394 --- /dev/null +++ b/doc/source/development_watchers.rst @@ -0,0 +1,112 @@ +================ +Auditor Watchers +================ + +-------- +Overview +-------- + +The duty of auditors is to guard Swift against corruption in the +storage media. But because auditors crawl all objects, they can be +used to program Swift to operate on every object. It is done through +an API known as "watcher". + +Watchers do not have any private view into the cluster. +An operator can write a standalone program that walks the +directories and performs any desired inspection or maintenance. 
+What watcher brings to the table is a framework to do the same +job easily, under resource restrictions already in place +for the auditor. + +Operations performed by watchers are often site-specific, or else +they would be incorporated into Swift already. However, the code in +the tree provides a reference implementation for convenience. +It is located in swift/obj/watchers/dark_data.py and implements +so-called "Dark Data Watcher". + +Currently, only object auditor supports the watchers. + +------------- +The API class +------------- + +The implementation of a watcher is a Python class that may look like this:: + + class MyWatcher(object): + + def __init__(self, conf, logger, **kwargs): + pass + + def start(self, audit_type, **kwargs): + pass + + def see_object(self, object_metadata, policy_index, partition, + data_file_path, **kwargs): + pass + + def end(self, **kwargs): + pass + +Arguments to watcher methods are passed as keyword arguments, +and methods are expected to consume new, unknown arguments. + +The method __init__() is used to save configuration and logger +at the start of the plug-in. + +The method start() is invoked when auditor starts a pass. +It usually resets counters. The argument `auditor_type` is string of +`"ALL"` or `"ZBF"`, according to the type of the auditor running +the watcher. Watchers that talk to the network tend to hang off the +ALL-type auditor, the lightweight ones are okay with the ZBF-type. + +The method end() is the closing bracket for start(). It is typically +used to log something, or dump some statistics. + +The method see_object() is called when auditor completed an audit +of an object. This is where most of the work is done. + +The protocol for see_object() allows it to raise a special exception, +QuarantienRequested. Auditor catches it and quarantines the object. +In general, it's okay for watcher methods to throw exceptions, so +an author of a watcher plugin does not have to catch them explicitly +with a try:; they can be just permitted to bubble up naturally. + +------------------- +Loading the plugins +------------------- + +Swift auditor loads watcher classes from eggs, so it is necessary +to wrap the class and provide it an entry point:: + + $ cat /usr/lib/python3.8/site-p*/mywatcher*egg-info/entry_points.txt + [mywatcher.mysection] + mywatcherentry = mywatcher:MyWatcher + +Operator tells Swift auditor what plugins to load by adding them +to object-server.conf in the section [object-auditor]. It is also +possible to pass parameters, arriving in the argument conf{} of +method start():: + + [object-auditor] + watchers = mywatcher#mywatcherentry,swift#dark_data + + [object-auditor:watcher:mywatcher#mywatcherentry] + myparam=testing2020 + +Do not forget to remove the watcher from auditors when done. +Although the API itself is very lightweight, it is common for watchers +to incur a significant performance penalty: they can talk to networked +services or access additional objects. + +----------------- +Dark Data Watcher +----------------- + +The watcher API is assumed to be under development. Operators who +need extensions are welcome to report any needs for more arguments +to see_object(). + +The :ref:`dark_data` watcher has been provided as an example. If an +operator wants to create their own watcher, start by copying +the provided example template ``swift/obj/watchers/dark_data.py`` and see +if it is sufficient. 
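On a SAIO-style install it is easy to exercise the watcher hooks without packaging an egg of your own, because Swift already ships the ``swift#dark_data`` entry point used in the configuration example above. A minimal sketch, assuming the per-node object server configuration files described elsewhere in these docs: add the ``watchers`` line to the existing ``[object-auditor]`` section of each ``/etc/swift/object-server/*.conf``::

    [object-auditor]
    watchers = swift#dark_data

then trigger a single audit pass and look for the watcher's output in the object auditor log::

    swift-init object-auditor once

Removing the ``watchers`` line afterwards returns the auditor to its normal, watcher-free behaviour.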
diff --git a/doc/source/first_contribution_swift.rst b/doc/source/first_contribution_swift.rst new file mode 100644 index 0000000000..8d986c3187 --- /dev/null +++ b/doc/source/first_contribution_swift.rst @@ -0,0 +1,208 @@ +=========================== +First Contribution to Swift +=========================== + +------------- +Getting Swift +------------- + +.. highlight: none + +Swift's source code is hosted on github and managed with git. The current +trunk can be checked out like this:: + + git clone https://github.com/openstack/swift.git + +This will clone the Swift repository under your account. + +A source tarball for the latest release of Swift is available on the +`launchpad project page `_. + +Prebuilt packages for Ubuntu and RHEL variants are available. + +* `Swift Ubuntu Packages `_ +* `Swift RDO Packages `_ + +-------------------- +Source Control Setup +-------------------- + +Swift uses ``git`` for source control. The OpenStack +`Developer's Guide `_ +describes the steps for setting up Git and all the necessary accounts for +contributing code to Swift. + +---------------- +Changes to Swift +---------------- + +Once you have the source code and source control set up, you can make your +changes to Swift. + +------- +Testing +------- + +The :doc:`Development Guidelines ` describe the testing +requirements before submitting Swift code. + +In summary, you can execute tox from the swift home directory (where you +checked out the source code):: + + tox + +Tox will present tests results. Notice that in the beginning, it is very common +to break many coding style guidelines. + +-------------------------- +Proposing changes to Swift +-------------------------- + +The OpenStack +`Developer's Guide `_ +describes the most common ``git`` commands that you will need. + +Following is a list of the commands that you need to know for your first +contribution to Swift: + +To clone a copy of Swift:: + + git clone https://github.com/openstack/swift.git + +Under the swift directory, set up the Gerrit repository. The following command +configures the repository to know about Gerrit and installs the ``Change-Id`` +commit hook. You only need to do this once:: + + git review -s + +To create your development branch (substitute branch_name for a name of your +choice:: + + git checkout -b + +To check the files that have been updated in your branch:: + + git status + +To check the differences between your branch and the repository:: + + git diff + +Assuming you have not added new files, you commit all your changes using:: + + git commit -a + +Read the `Summary of Git commit message structure `_ +for best practices on writing the commit message. When you are ready to send +your changes for review use:: + + git review + +If successful, Git response message will contain a URL you can use to track your +changes. + +If you need to make further changes to the same review, you can commit them +using:: + + git commit -a --amend + +This will commit the changes under the same set of changes you issued earlier. +Notice that in order to send your latest version for review, you will still +need to call:: + + git review + +--------------------- +Tracking your changes +--------------------- + +After proposing changes to Swift, you can track them at +https://review.opendev.org. After logging in, you will see a dashboard of +"Outgoing reviews" for changes you have proposed, "Incoming reviews" for +changes you are reviewing, and "Recently closed" changes for which you were +either a reviewer or owner. + +.. 
_post-rebase-instructions: + +------------------------ +Post rebase instructions +------------------------ + +After rebasing, the following steps should be performed to rebuild the swift +installation. Note that these commands should be performed from the root of the +swift repo directory (e.g. ``$HOME/swift/``):: + + sudo python setup.py develop + sudo pip install -r test-requirements.txt + +If using TOX, depending on the changes made during the rebase, you may need to +rebuild the TOX environment (generally this will be the case if +test-requirements.txt was updated such that a new version of a package is +required), this can be accomplished using the ``-r`` argument to the TOX cli:: + + tox -r + +You can include any of the other TOX arguments as well, for example, to run the +pep8 suite and rebuild the TOX environment the following can be used:: + + tox -r -e pep8 + +The rebuild option only needs to be specified once for a particular build (e.g. +pep8), that is further invocations of the same build will not require this +until the next rebase. + +--------------- +Troubleshooting +--------------- + +You may run into the following errors when starting Swift if you rebase +your commit using:: + + git rebase + +.. code-block:: python + + Traceback (most recent call last): + File "/usr/local/bin/swift-init", line 5, in + from pkg_resources import require + File "/usr/lib/python2.7/dist-packages/pkg_resources.py", line 2749, in + working_set = WorkingSet._build_master() + File "/usr/lib/python2.7/dist-packages/pkg_resources.py", line 446, in _build_master + return cls._build_from_requirements(__requires__) + File "/usr/lib/python2.7/dist-packages/pkg_resources.py", line 459, in _build_from_requirements + dists = ws.resolve(reqs, Environment()) + File "/usr/lib/python2.7/dist-packages/pkg_resources.py", line 628, in resolve + raise DistributionNotFound(req) + pkg_resources.DistributionNotFound: swift==2.3.1.devXXX + +(where XXX represents a dev version of Swift). + +.. 
code-block:: python + + Traceback (most recent call last): + File "/usr/local/bin/swift-proxy-server", line 10, in + execfile(__file__) + File "/home/swift/swift/bin/swift-proxy-server", line 23, in + sys.exit(run_wsgi(conf_file, 'proxy-server', **options)) + File "/home/swift/swift/swift/common/wsgi.py", line 888, in run_wsgi + loadapp(conf_path, global_conf=global_conf) + File "/home/swift/swift/swift/common/wsgi.py", line 390, in loadapp + func(PipelineWrapper(ctx)) + File "/home/swift/swift/swift/proxy/server.py", line 602, in modify_wsgi_pipeline + ctx = pipe.create_filter(filter_name) + File "/home/swift/swift/swift/common/wsgi.py", line 329, in create_filter + global_conf=self.context.global_conf) + File "/usr/lib/python2.7/dist-packages/paste/deploy/loadwsgi.py", line 296, in loadcontext + global_conf=global_conf) + File "/usr/lib/python2.7/dist-packages/paste/deploy/loadwsgi.py", line 328, in _loadegg + return loader.get_context(object_type, name, global_conf) + File "/usr/lib/python2.7/dist-packages/paste/deploy/loadwsgi.py", line 620, in get_context + object_type, name=name) + File "/usr/lib/python2.7/dist-packages/paste/deploy/loadwsgi.py", line 659, in find_egg_entry_point + for prot in protocol_options] or '(no entry points)')))) + LookupError: Entry point 'versioned_writes' not found in egg 'swift' (dir: /home/swift/swift; protocols: paste.filter_factory, paste.filter_app_factory; entry_points: ) + +This happens because ``git rebase`` will retrieve code for a different version +of Swift in the development stream, but the start scripts under +``/usr/local/bin`` have not been updated. The solution is to follow the steps +described in the :ref:`post-rebase-instructions` section. diff --git a/doc/source/getting_started.rst b/doc/source/getting_started.rst index dc6ee973d2..790ccd82dd 100644 --- a/doc/source/getting_started.rst +++ b/doc/source/getting_started.rst @@ -6,36 +6,17 @@ Getting Started System Requirements ------------------- -Swift development currently targets Ubuntu Server 10.04, but should work on -most Linux platforms with the following software: +Swift development currently targets Ubuntu Server 22.04, but should work on +most Linux platforms. -* Python 2.6 -* rsync 3.0 +Swift is written in Python and has these dependencies: -And the following python libraries: - -* Eventlet 0.9.8 -* Setuptools -* Simplejson -* Xattr -* Nose -* Sphinx -* netifaces - -------------- -Getting Swift -------------- - -Swift's source code is hosted on github and managed with git. The current trunk can be checked out like this: - - ``git clone https://github.com/openstack/swift.git`` - -A source tarball for the latest release of Swift is available on the `launchpad project page `_. - -Prebuilt packages for Ubuntu are available starting with Natty, or from PPAs for earlier releases. - -* `Swift Ubuntu Packages `_ -* `Swift PPA Archive `_ +* Python (3.6-3.12) +* rsync 3.x +* `liberasurecode `__ +* The Python packages listed in `the requirements file `__ +* Testing additionally requires `the test dependencies `__ +* Testing requires `these distribution packages `__ ----------- Development @@ -46,11 +27,24 @@ following docs will be useful: * :doc:`Swift All in One ` - Set up a VM with Swift installed * :doc:`Development Guidelines ` +* :doc:`First Contribution to Swift ` +* :doc:`Associated Projects ` + +-------------------------- +CLI client and SDK library +-------------------------- + +There are many clients in the :ref:`ecosystem `. The official CLI +and SDK is python-swiftclient. 
+ +* `Source code `__ +* `Python Package Index `__ ---------- Production ---------- -If you want to set up and configure Swift for a production cluster, the following doc should be useful: +If you want to set up and configure Swift for a production cluster, the +following doc should be useful: -* :doc:`Multiple Server Swift Installation ` +* :doc:`install/index` diff --git a/doc/source/howto_installmultinode.rst b/doc/source/howto_installmultinode.rst deleted file mode 100644 index 61d208191d..0000000000 --- a/doc/source/howto_installmultinode.rst +++ /dev/null @@ -1,443 +0,0 @@ -============================================================== -Instructions for a Multiple Server Swift Installation (Ubuntu) -============================================================== - -Prerequisites -------------- -* Ubuntu Server 10.04 LTS installation media - -.. note: - Swift can run with other distros, but for this document we will focus - on installing on Ubuntu Server, ypmv (your packaging may vary). - -Basic architecture and terms ----------------------------- -- *node* - a host machine running one or more Swift services -- *Proxy node* - node that runs Proxy services; also runs TempAuth -- *Storage node* - node that runs Account, Container, and Object services -- *ring* - a set of mappings of Swift data to physical devices - -This document shows a cluster using the following types of nodes: - -- one Proxy node - - - Runs the swift-proxy-server processes which proxy requests to the - appropriate Storage nodes. The proxy server will also contain - the TempAuth service as WSGI middleware. - -- five Storage nodes - - - Runs the swift-account-server, swift-container-server, and - swift-object-server processes which control storage of the account - databases, the container databases, as well as the actual stored - objects. - -.. note:: - Fewer Storage nodes can be used initially, but a minimum of 5 is - recommended for a production cluster. - -This document describes each Storage node as a separate zone in the ring. -It is recommended to have a minimum of 5 zones. A zone is a group of nodes -that is as isolated as possible from other nodes (separate servers, network, -power, even geography). The ring guarantees that every replica is stored -in a separate zone. For more information about the ring and zones, see: :doc:`The Rings `. - -To increase reliability, you may want to add additional Proxy servers for performance which is described in :ref:`add-proxy-server`. - -Network Setup Notes -------------------- - -This document refers to two networks. An external network for connecting to the Proxy server, and a storage network that is not accessibile from outside the cluster, to which all of the nodes are connected. All of the Swift services, as well as the rsync daemon on the Storage nodes are configured to listen on their STORAGE_LOCAL_NET IP addresses. - -.. note:: - Run all commands as the root user - -General OS configuration and partitioning for each node -------------------------------------------------------- - -#. Install the baseline Ubuntu Server 10.04 LTS on all nodes. - -#. Install common Swift software prereqs:: - - apt-get install python-software-properties - add-apt-repository ppa:swift-core/release - apt-get update - apt-get install swift python-swiftclient openssh-server - -#. Create and populate configuration directories:: - - mkdir -p /etc/swift - chown -R swift:swift /etc/swift/ - -#. 
On the first node only, create /etc/swift/swift.conf:: - - cat >/etc/swift/swift.conf </etc/swift/proxy-server.conf <> /etc/fstab - mkdir -p /srv/node/sdb1 - mount /srv/node/sdb1 - chown -R swift:swift /srv/node - -#. Create /etc/rsyncd.conf:: - - cat >/etc/rsyncd.conf </etc/swift/account-server.conf </etc/swift/container-server.conf </etc/swift/object-server.conf <' - -#. Check that ``swift`` works (at this point, expect zero containers, zero objects, and zero bytes):: - - swift -A https://$PROXY_LOCAL_NET_IP:8080/auth/v1.0 -U system:root -K testpass stat - -#. Use ``swift`` to upload a few files named 'bigfile[1-2].tgz' to a container named 'myfiles':: - - swift -A https://$PROXY_LOCAL_NET_IP:8080/auth/v1.0 -U system:root -K testpass upload myfiles bigfile1.tgz - swift -A https://$PROXY_LOCAL_NET_IP:8080/auth/v1.0 -U system:root -K testpass upload myfiles bigfile2.tgz - -#. Use ``swift`` to download all files from the 'myfiles' container:: - - swift -A https://$PROXY_LOCAL_NET_IP:8080/auth/v1.0 -U system:root -K testpass download myfiles - -#. Use ``swift`` to save a backup of your builder files to a container named 'builders'. Very important not to lose your builders!:: - - swift -A https://$PROXY_LOCAL_NET_IP:8080/auth/v1.0 -U system:root -K testpass upload builders /etc/swift/*.builder - -#. Use ``swift`` to list your containers:: - - swift -A https://$PROXY_LOCAL_NET_IP:8080/auth/v1.0 -U system:root -K testpass list - -#. Use ``swift`` to list the contents of your 'builders' container:: - - swift -A https://$PROXY_LOCAL_NET_IP:8080/auth/v1.0 -U system:root -K testpass list builders - -#. Use ``swift`` to download all files from the 'builders' container:: - - swift -A https://$PROXY_LOCAL_NET_IP:8080/auth/v1.0 -U system:root -K testpass download builders - -.. _add-proxy-server: - -Adding a Proxy Server ---------------------- - -For reliability's sake you may want to have more than one proxy server. You can set up the additional proxy node in the same manner that you set up the first proxy node but with additional configuration steps. - -Once you have more than two proxies, you also want to load balance between the two, which means your storage endpoint also changes. You can select from different strategies for load balancing. For example, you could use round robin dns, or an actual load balancer (like pound) in front of the two proxies, and point your storage url to the load balancer. - -See :ref:`config-proxy` for the initial setup, and then follow these additional steps. - -#. Update the list of memcache servers in /etc/swift/proxy-server.conf for all the added proxy servers. If you run multiple memcache servers, use this pattern for the multiple IP:port listings: `10.1.2.3:11211,10.1.2.4:11211` in each proxy server's conf file.:: - - [filter:cache] - use = egg:swift#memcache - memcache_servers = $PROXY_LOCAL_NET_IP:11211 - -#. Change the storage url for any users to point to the load balanced url, rather than the first proxy server you created in /etc/swift/proxy-server.conf:: - - [filter:tempauth] - use = egg:swift#tempauth - user_system_root = testpass .admin http[s]://:/v1/AUTH_system - -#. Next, copy all the ring information to all the nodes, including your new proxy nodes, and ensure the ring info gets to all the storage nodes as well. - -#. After you sync all the nodes, make sure the admin has the keys in /etc/swift and the ownership for the ring file is correct. 
- -Troubleshooting Notes ---------------------- -If you see problems, look in var/log/syslog (or messages on some distros). - -Also, at Rackspace we have seen hints at drive failures by looking at error messages in /var/log/kern.log. - -There are more debugging hints and tips in the :doc:`admin_guide`. diff --git a/doc/source/images/ec_overview.png b/doc/source/images/ec_overview.png new file mode 100644 index 0000000000..d44a103177 Binary files /dev/null and b/doc/source/images/ec_overview.png differ diff --git a/doc/source/images/reload_process_tree_1.svg b/doc/source/images/reload_process_tree_1.svg new file mode 100644 index 0000000000..fe026aac4d --- /dev/null +++ b/doc/source/images/reload_process_tree_1.svg @@ -0,0 +1,35 @@ + + + + + + Manager Process + + + + + + Workers + + + + diff --git a/doc/source/images/reload_process_tree_2.svg b/doc/source/images/reload_process_tree_2.svg new file mode 100644 index 0000000000..ef071e2480 --- /dev/null +++ b/doc/source/images/reload_process_tree_2.svg @@ -0,0 +1,41 @@ + + + + + + Manager Process + + + + + + Workers + + + + Socket Closer + + + + + diff --git a/doc/source/images/reload_process_tree_3.svg b/doc/source/images/reload_process_tree_3.svg new file mode 100644 index 0000000000..93918a72e9 --- /dev/null +++ b/doc/source/images/reload_process_tree_3.svg @@ -0,0 +1,41 @@ + + + + + + Re-exec'ed Manager + + + + + + Old Workers + + + + Socket Closer + + + + + diff --git a/doc/source/images/reload_process_tree_4.svg b/doc/source/images/reload_process_tree_4.svg new file mode 100644 index 0000000000..fd04d0a30f --- /dev/null +++ b/doc/source/images/reload_process_tree_4.svg @@ -0,0 +1,49 @@ + + + + + + Re-exec'ed Manager + + + + + + Old Workers + + + + Socket Closer + + + + + + New Workers + + + + + + diff --git a/doc/source/images/reload_process_tree_5.svg b/doc/source/images/reload_process_tree_5.svg new file mode 100644 index 0000000000..baac19884b --- /dev/null +++ b/doc/source/images/reload_process_tree_5.svg @@ -0,0 +1,43 @@ + + + + + + Re-exec'ed Manager + + + + + + Old Workers + + + + + + New Workers + + + + + diff --git a/doc/source/images/reload_process_tree_6.svg b/doc/source/images/reload_process_tree_6.svg new file mode 100644 index 0000000000..730a8ac6ba --- /dev/null +++ b/doc/source/images/reload_process_tree_6.svg @@ -0,0 +1,35 @@ + + + + + + Re-exec'ed Manager + + + + + + New Workers + + + + diff --git a/doc/source/images/sharded_GET.svg b/doc/source/images/sharded_GET.svg new file mode 100644 index 0000000000..03c271b5cc --- /dev/null +++ b/doc/source/images/sharded_GET.svg @@ -0,0 +1,2019 @@ + + + + + + image/svg+xml + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + cont (fresh db) + /.shards_acct + /acct + cont-568d8e-<ts>-0 + + + cont-750ed3-<ts>-1 + cont-4ec28d-<ts>-2 + + cont-aef34f-<ts>-3 + "" - "cat" + "cat" - "giraffe" + "giraffe" - "igloo" + "igloo" - "linux" + + cont-4837ad-<ts>-4 + "linux" - "" + + proxy + + + + + + + + 1 + + + + 2 + + + + 3 + + + + 4 + + + + 5 + + diff --git 
a/doc/source/images/sharding_GET.svg b/doc/source/images/sharding_GET.svg new file mode 100644 index 0000000000..5e9240feeb
[New SVG diagrams for the container-sharding documentation: sharding_GET.svg, sharding_cleave1_load.svg, sharding_cleave2_load.svg, sharding_cleave_basic.svg, sharding_db_states.svg, sharding_scan_basic.svg, sharding_scan_load.svg and sharding_sharded_load.svg. Only the diagram labels are recoverable here: the /acct and /.shards_acct paths, shard containers such as cont-568d8e-<ts>-0, shard ranges from "" - "cat" through "linux" - "", and the UNSHARDED / SHARDING / SHARDED DB states.]
"giraffe" - "igloo" + "igloo" - "linux" + + + + cont-4837ad-<ts>-4 + "linux" - "" + diff --git a/doc/source/images/sharding_unsharded.svg b/doc/source/images/sharding_unsharded.svg new file mode 100644 index 0000000000..4241b0de13 --- /dev/null +++ b/doc/source/images/sharding_unsharded.svg @@ -0,0 +1,199 @@ + + + + + + image/svg+xml + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + /acct + cont + diff --git a/doc/source/images/sharding_unsharded_load.svg b/doc/source/images/sharding_unsharded_load.svg new file mode 100644 index 0000000000..e613e8cbbd --- /dev/null +++ b/doc/source/images/sharding_unsharded_load.svg @@ -0,0 +1,219 @@ + + + + + + image/svg+xml + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + cont + /acct + diff --git a/doc/source/index.rst b/doc/source/index.rst index 2d8b97ba5a..6332d396e5 100644 --- a/doc/source/index.rst +++ b/doc/source/index.rst @@ -1,5 +1,5 @@ .. - Copyright 2010-2012 OpenStack LLC + Copyright 2010-2012 OpenStack Foundation All Rights Reserved. Licensed under the Apache License, Version 2.0 (the "License"); you may @@ -13,16 +13,17 @@ WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License. - + +================================= Welcome to Swift's documentation! ================================= -Swift is a highly available, distributed, eventually consistent object/blob +Swift is a highly available, distributed, eventually consistent object/blob store. Organizations can use Swift to store lots of data efficiently, safely, and cheaply. This documentation is generated by the Sphinx toolkit and lives in the source tree. Additional documentation on Swift and other components of OpenStack can -be found on the `OpenStack wiki`_ and at http://docs.openstack.org. +be found on the `OpenStack wiki`_ and at http://docs.openstack.org. .. _`OpenStack wiki`: http://wiki.openstack.org @@ -32,8 +33,8 @@ be found on the `OpenStack wiki`_ and at http://docs.openstack.org. .. toctree:: - :maxdepth: 1 - + :maxdepth: 2 + getting_started Overview and Concepts @@ -42,18 +43,40 @@ Overview and Concepts .. toctree:: :maxdepth: 1 + api/object_api_v1_overview overview_architecture + overview_wsgi_management overview_ring + overview_ring_format + overview_policies overview_reaper overview_auth + overview_acl overview_replication ratelimit overview_large_objects - overview_object_versioning + overview_global_cluster overview_container_sync overview_expiring_objects + cors + crossdomain + overview_erasure_code + overview_encryption + overview_backing_store + overview_container_sharding + ring_background + ring_partpower associated_projects +Contributor Documentation +========================= + +.. toctree:: + :maxdepth: 2 + + contributor/contributing + contributor/review_guidelines + Developer Documentation ======================= @@ -62,17 +85,73 @@ Developer Documentation development_guidelines development_saio + first_contribution_swift + policies_saio development_auth + development_middleware + development_ondisk_backends + development_watchers Administrator Documentation =========================== .. 
toctree:: :maxdepth: 1 - - howto_installmultinode + deployment_guide + apache_deployment_guide admin_guide + replication_network + logs + ops_runbook/index + admin/index + install/index + config/index + + +Object Storage v1 REST API Documentation +======================================== + +See `Complete Reference for the Object Storage REST API `_ + +The following provides supporting information for the REST API: + +.. toctree:: + :maxdepth: 1 + + api/object_api_v1_overview.rst + api/discoverability.rst + api/authentication.rst + api/container_quotas.rst + api/object_versioning.rst + api/large_objects.rst + api/temporary_url_middleware.rst + api/form_post_middleware.rst + api/use_content-encoding_metadata.rst + api/use_the_content-disposition_metadata.rst + api/pseudo-hierarchical-folders-directories.rst + api/pagination.rst + api/serialized-response-formats.rst + api/static-website.rst + api/object-expiration.rst + api/bulk-delete.rst + +S3 Compatibility Info +===================== + +.. toctree:: + :maxdepth: 1 + + s3_compat + +OpenStack End User Guide +======================== + +The `OpenStack End User Guide `_ +has additional information on using Swift. +See the `Manage objects and containers `_ +section. + Source Documentation ==================== @@ -87,6 +166,8 @@ Source Documentation db object misc + middleware + audit_watchers Indices and tables @@ -95,4 +176,3 @@ Indices and tables * :ref:`genindex` * :ref:`modindex` * :ref:`search` - diff --git a/doc/source/install/controller-common_prerequisites.txt b/doc/source/install/controller-common_prerequisites.txt new file mode 100644 index 0000000000..0ba7c3d5f1 --- /dev/null +++ b/doc/source/install/controller-common_prerequisites.txt @@ -0,0 +1,116 @@ +Prerequisites +------------- + +The proxy service relies on an authentication and authorization mechanism such +as the Identity service. However, unlike other services, it also offers an +internal mechanism that allows it to operate without any other OpenStack +services. Before you configure the Object Storage service, you must +create service credentials and an API endpoint. + +.. note:: + + The Object Storage service does not use an SQL database on the controller + node. Instead, it uses distributed SQLite databases on each storage node. + +#. Source the ``admin`` credentials to gain access to admin-only CLI commands: + + .. code-block:: console + + $ . admin-openrc + +#. To create the Identity service credentials, complete these steps: + + * Create the ``swift`` user: + + .. code-block:: console + + $ openstack user create --domain default --password-prompt swift + User Password: + Repeat User Password: + +-----------+----------------------------------+ + | Field | Value | + +-----------+----------------------------------+ + | domain_id | default | + | enabled | True | + | id | d535e5cbd2b74ac7bfb97db9cced3ed6 | + | name | swift | + +-----------+----------------------------------+ + + * Add the ``admin`` role to the ``swift`` user: + + .. code-block:: console + + $ openstack role add --project service --user swift admin + + .. note:: + + This command provides no output. + + * Create the ``swift`` service entity: + + .. 
code-block:: console + + $ openstack service create --name swift \ + --description "OpenStack Object Storage" object-store + +-------------+----------------------------------+ + | Field | Value | + +-------------+----------------------------------+ + | description | OpenStack Object Storage | + | enabled | True | + | id | 75ef509da2c340499d454ae96a2c5c34 | + | name | swift | + | type | object-store | + +-------------+----------------------------------+ + +#. Create the Object Storage service API endpoints: + + .. code-block:: console + + $ openstack endpoint create --region RegionOne \ + object-store public http://controller:8080/v1/AUTH_%\(project_id\)s + +--------------+----------------------------------------------+ + | Field | Value | + +--------------+----------------------------------------------+ + | enabled | True | + | id | 12bfd36f26694c97813f665707114e0d | + | interface | public | + | region | RegionOne | + | region_id | RegionOne | + | service_id | 75ef509da2c340499d454ae96a2c5c34 | + | service_name | swift | + | service_type | object-store | + | url | http://controller:8080/v1/AUTH_%(project_id)s | + +--------------+----------------------------------------------+ + + $ openstack endpoint create --region RegionOne \ + object-store internal http://controller:8080/v1/AUTH_%\(project_id\)s + +--------------+----------------------------------------------+ + | Field | Value | + +--------------+----------------------------------------------+ + | enabled | True | + | id | 7a36bee6733a4b5590d74d3080ee6789 | + | interface | internal | + | region | RegionOne | + | region_id | RegionOne | + | service_id | 75ef509da2c340499d454ae96a2c5c34 | + | service_name | swift | + | service_type | object-store | + | url | http://controller:8080/v1/AUTH_%(project_id)s | + +--------------+----------------------------------------------+ + + $ openstack endpoint create --region RegionOne \ + object-store admin http://controller:8080/v1 + +--------------+----------------------------------+ + | Field | Value | + +--------------+----------------------------------+ + | enabled | True | + | id | ebb72cd6851d4defabc0b9d71cdca69b | + | interface | admin | + | region | RegionOne | + | region_id | RegionOne | + | service_id | 75ef509da2c340499d454ae96a2c5c34 | + | service_name | swift | + | service_type | object-store | + | url | http://controller:8080/v1 | + +--------------+----------------------------------+ + diff --git a/doc/source/install/controller-include.txt b/doc/source/install/controller-include.txt new file mode 100644 index 0000000000..ec6b37a270 --- /dev/null +++ b/doc/source/install/controller-include.txt @@ -0,0 +1,84 @@ +Edit the ``/etc/swift/proxy-server.conf`` file and complete the +following actions: + +* In the ``[DEFAULT]`` section, configure the bind port, user, and + configuration directory: + + .. code-block:: none + + [DEFAULT] + ... + bind_port = 8080 + user = swift + swift_dir = /etc/swift + +* In the ``[pipeline:main]`` section, remove the ``tempurl`` and + ``tempauth`` modules and add the ``authtoken`` and ``keystoneauth`` + modules: + + .. code-block:: none + + [pipeline:main] + pipeline = catch_errors gatekeeper healthcheck proxy-logging cache container_sync bulk ratelimit authtoken keystoneauth container-quotas account-quotas slo dlo versioned_writes proxy-logging proxy-server + + .. note:: + + Do not change the order of the modules. + + .. note:: + + For more information on other modules that enable additional features, + see the `Deployment Guide `__. 
+ +* In the ``[app:proxy-server]`` section, enable automatic account creation: + + .. code-block:: console + + [app:proxy-server] + use = egg:swift#proxy + ... + account_autocreate = True + +* In the ``[filter:keystoneauth]`` section, configure the operator roles: + + .. code-block:: console + + [filter:keystoneauth] + use = egg:swift#keystoneauth + ... + operator_roles = admin,user + +* In the ``[filter:authtoken]`` section, configure Identity service access: + + .. code-block:: none + + [filter:authtoken] + paste.filter_factory = keystonemiddleware.auth_token:filter_factory + ... + www_authenticate_uri = http://controller:5000 + auth_url = http://controller:5000 + memcached_servers = controller:11211 + auth_type = password + project_domain_id = default + user_domain_id = default + project_name = service + username = swift + password = SWIFT_PASS + delay_auth_decision = True + + Replace ``SWIFT_PASS`` with the password you chose for the ``swift`` user + in the Identity service. + + .. note:: + + Comment out or remove any other options in the ``[filter:authtoken]`` + section. + +* In the ``[filter:cache]`` section, configure the ``memcached`` location: + + .. code-block:: none + + [filter:cache] + use = egg:swift#memcache + ... + memcache_servers = controller:11211 diff --git a/doc/source/install/controller-install-debian.rst b/doc/source/install/controller-install-debian.rst new file mode 100644 index 0000000000..abcd65ff77 --- /dev/null +++ b/doc/source/install/controller-install-debian.rst @@ -0,0 +1,52 @@ +.. _controller-debian: + +Install and configure the controller node for Debian +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +This section describes how to install and configure the proxy service that +handles requests for the account, container, and object services operating +on the storage nodes. For simplicity, this guide installs and configures +the proxy service on the controller node. However, you can run the proxy +service on any node with network connectivity to the storage nodes. +Additionally, you can install and configure the proxy service on multiple +nodes to increase performance and redundancy. For more information, see the +`Deployment Guide `__. + +This section applies to Debian. + +.. include:: controller-common_prerequisites.txt + +Install and configure components +-------------------------------- + +.. note:: + + Default configuration files vary by distribution. You might need + to add these sections and options rather than modifying existing + sections and options. Also, an ellipsis (``...``) in the configuration + snippets indicates potential default configuration options that you + should retain. + +#. Install the packages: + + .. code-block:: console + + # apt-get install swift swift-proxy python3-swiftclient \ + python3-keystoneclient python3-keystonemiddleware \ + memcached + + .. note:: + + Complete OpenStack environments already include some of these + packages. + + 2. Create the ``/etc/swift`` directory. + + 3. Obtain the proxy service configuration file from the Object Storage + source repository: + + .. code-block:: console + + # curl -o /etc/swift/proxy-server.conf https://opendev.org/openstack/swift/raw/branch/master/etc/proxy-server.conf-sample + + 4. .. include:: controller-include.txt diff --git a/doc/source/install/controller-install-rdo.rst b/doc/source/install/controller-install-rdo.rst new file mode 100644 index 0000000000..076ecaf200 --- /dev/null +++ b/doc/source/install/controller-install-rdo.rst @@ -0,0 +1,50 @@ +.. 
_controller-rdo: + +Install and configure the controller node for Red Hat Enterprise Linux and CentOS +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +This section describes how to install and configure the proxy service that +handles requests for the account, container, and object services operating +on the storage nodes. For simplicity, this guide installs and configures +the proxy service on the controller node. However, you can run the proxy +service on any node with network connectivity to the storage nodes. +Additionally, you can install and configure the proxy service on multiple +nodes to increase performance and redundancy. For more information, see the +`Deployment Guide `__. + +This section applies to Red Hat Enterprise Linux 9 and CentOS stream9. + +.. include:: controller-common_prerequisites.txt + +Install and configure components +-------------------------------- + +.. note:: + + Default configuration files vary by distribution. You might need + to add these sections and options rather than modifying existing + sections and options. Also, an ellipsis (``...``) in the configuration + snippets indicates potential default configuration options that you + should retain. + +#. Install the packages: + + .. code-block:: console + + # dnf install openstack-swift-proxy python3-swiftclient \ + python3-keystoneclient python3-keystonemiddleware \ + memcached + + .. note:: + + Complete OpenStack environments already include some of these + packages. + + 2. Obtain the proxy service configuration file from the Object Storage + source repository: + + .. code-block:: console + + # curl -o /etc/swift/proxy-server.conf https://opendev.org/openstack/swift/raw/branch/master/etc/proxy-server.conf-sample + + 3. .. include:: controller-include.txt diff --git a/doc/source/install/controller-install-ubuntu.rst b/doc/source/install/controller-install-ubuntu.rst new file mode 100644 index 0000000000..e60ba8e872 --- /dev/null +++ b/doc/source/install/controller-install-ubuntu.rst @@ -0,0 +1,52 @@ +.. _controller-ubuntu: + +Install and configure the controller node for Ubuntu +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +This section describes how to install and configure the proxy service that +handles requests for the account, container, and object services operating +on the storage nodes. For simplicity, this guide installs and configures +the proxy service on the controller node. However, you can run the proxy +service on any node with network connectivity to the storage nodes. +Additionally, you can install and configure the proxy service on multiple +nodes to increase performance and redundancy. For more information, see the +`Deployment Guide `__. + +This section applies to Ubuntu 14.04 (LTS). + +.. include:: controller-common_prerequisites.txt + +Install and configure components +-------------------------------- + +.. note:: + + Default configuration files vary by distribution. You might need + to add these sections and options rather than modifying existing + sections and options. Also, an ellipsis (``...``) in the configuration + snippets indicates potential default configuration options that you + should retain. + +#. Install the packages: + + .. code-block:: console + + # apt-get install swift swift-proxy python-swiftclient \ + python-keystoneclient python-keystonemiddleware \ + memcached + + .. note:: + + Complete OpenStack environments already include some of these + packages. + + 2. Create the ``/etc/swift`` directory. + + 3. 
Obtain the proxy service configuration file from the Object Storage + source repository: + + .. code-block:: console + + # curl -o /etc/swift/proxy-server.conf https://opendev.org/openstack/swift/raw/branch/master/etc/proxy-server.conf-sample + + 4. .. include:: controller-include.txt diff --git a/doc/source/install/controller-install.rst b/doc/source/install/controller-install.rst new file mode 100644 index 0000000000..294c2396b3 --- /dev/null +++ b/doc/source/install/controller-install.rst @@ -0,0 +1,17 @@ +.. _controller: + +Install and configure the controller node +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +This section describes how to install and configure the proxy service that +handles requests for the account, container, and object services operating +on the storage nodes. + +Note that installation and configuration vary by distribution. + +.. toctree:: + :maxdepth: 1 + + controller-install-rdo.rst + controller-install-ubuntu.rst + controller-install-debian.rst diff --git a/doc/source/install/edit_hosts_file.txt b/doc/source/install/edit_hosts_file.txt new file mode 100644 index 0000000000..2e9bc9659f --- /dev/null +++ b/doc/source/install/edit_hosts_file.txt @@ -0,0 +1,19 @@ +Edit the ``/etc/hosts`` file to contain the following: + +.. code-block:: none + + # controller + 10.0.0.11 controller + + # compute1 + 10.0.0.31 compute1 + + # block1 + 10.0.0.41 block1 + + # object1 + 10.0.0.51 object1 + + # object2 + 10.0.0.52 object2 + diff --git a/doc/source/install/environment-networking.rst b/doc/source/install/environment-networking.rst new file mode 100644 index 0000000000..befb309fa7 --- /dev/null +++ b/doc/source/install/environment-networking.rst @@ -0,0 +1,66 @@ +.. _networking: + +Configure networking +~~~~~~~~~~~~~~~~~~~~ + +Before you start deploying the Object Storage service in your OpenStack +environment, configure networking for two additional storage nodes. + +First node +---------- + +Configure network interfaces +^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +* Configure the management interface: + + * IP address: ``10.0.0.51`` + + * Network mask: ``255.255.255.0`` (or ``/24``) + + * Default gateway: ``10.0.0.1`` + +Configure name resolution +^^^^^^^^^^^^^^^^^^^^^^^^^ + +#. Set the hostname of the node to ``object1``. + +#. .. include:: edit_hosts_file.txt + +#. Reboot the system to activate the changes. + +Second node +----------- + +Configure network interfaces +^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +* Configure the management interface: + + * IP address: ``10.0.0.52`` + + * Network mask: ``255.255.255.0`` (or ``/24``) + + * Default gateway: ``10.0.0.1`` + +Configure name resolution +^^^^^^^^^^^^^^^^^^^^^^^^^ + +#. Set the hostname of the node to ``object2``. + +#. .. include:: edit_hosts_file.txt + +#. Reboot the system to activate the changes. + +.. warning:: + + Some distributions add an extraneous entry in the ``/etc/hosts`` + file that resolves the actual hostname to another loopback IP + address such as ``127.0.1.1``. You must comment out or remove this + entry to prevent name resolution problems. **Do not remove the + 127.0.0.1 entry.** + +.. note:: + + To reduce complexity of this guide, we add host entries for optional + services regardless of whether you choose to deploy them. diff --git a/doc/source/install/finalize-installation-rdo.rst b/doc/source/install/finalize-installation-rdo.rst new file mode 100644 index 0000000000..ec6b115061 --- /dev/null +++ b/doc/source/install/finalize-installation-rdo.rst @@ -0,0 +1,89 @@ +.. 
_finalize-rdo: + +Finalize installation for Red Hat Enterprise Linux and CentOS +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +.. note:: + + Default configuration files vary by distribution. You might need + to add these sections and options rather than modifying existing + sections and options. Also, an ellipsis (``...``) in the configuration + snippets indicates potential default configuration options that you + should retain. + +This section applies to Red Hat Enterprise Linux 9 and CentOS stream9. + +#. Obtain the ``/etc/swift/swift.conf`` file from the Object + Storage source repository: + + .. code-block:: console + + # curl -o /etc/swift/swift.conf \ + https://opendev.org/openstack/swift/raw/branch/master/etc/swift.conf-sample + +#. Edit the ``/etc/swift/swift.conf`` file and complete the following + actions: + + * In the ``[swift-hash]`` section, configure the hash path prefix and + suffix for your environment. + + .. code-block:: none + + [swift-hash] + ... + swift_hash_path_suffix = HASH_PATH_SUFFIX + swift_hash_path_prefix = HASH_PATH_PREFIX + + Replace HASH_PATH_PREFIX and HASH_PATH_SUFFIX with unique values. + + .. warning:: + + Keep these values secret and do not change or lose them. + + * In the ``[storage-policy:0]`` section, configure the default + storage policy: + + .. code-block:: none + + [storage-policy:0] + ... + name = Policy-0 + default = yes + +#. Copy the ``swift.conf`` file to the ``/etc/swift`` directory on + each storage node and any additional nodes running the proxy service. + +4. On all nodes, ensure proper ownership of the configuration directory: + + .. code-block:: console + + # chown -R root:swift /etc/swift + +5. On the controller node and any other nodes running the proxy service, + start the Object Storage proxy service including its dependencies and + configure them to start when the system boots: + + .. code-block:: console + + # systemctl enable openstack-swift-proxy.service memcached.service + # systemctl start openstack-swift-proxy.service memcached.service + +6. On the storage nodes, start the Object Storage services and configure + them to start when the system boots: + + .. 
code-block:: console + + # systemctl enable openstack-swift-account.service openstack-swift-account-auditor.service \ + openstack-swift-account-reaper.service openstack-swift-account-replicator.service + # systemctl start openstack-swift-account.service openstack-swift-account-auditor.service \ + openstack-swift-account-reaper.service openstack-swift-account-replicator.service + # systemctl enable openstack-swift-container.service \ + openstack-swift-container-auditor.service openstack-swift-container-replicator.service \ + openstack-swift-container-updater.service + # systemctl start openstack-swift-container.service \ + openstack-swift-container-auditor.service openstack-swift-container-replicator.service \ + openstack-swift-container-updater.service + # systemctl enable openstack-swift-object.service openstack-swift-object-auditor.service \ + openstack-swift-object-replicator.service openstack-swift-object-updater.service + # systemctl start openstack-swift-object.service openstack-swift-object-auditor.service \ + openstack-swift-object-replicator.service openstack-swift-object-updater.service diff --git a/doc/source/install/finalize-installation-ubuntu-debian.rst b/doc/source/install/finalize-installation-ubuntu-debian.rst new file mode 100644 index 0000000000..ccde2fd568 --- /dev/null +++ b/doc/source/install/finalize-installation-ubuntu-debian.rst @@ -0,0 +1,80 @@ +.. _finalize-ubuntu-debian: + +Finalize installation for Ubuntu and Debian +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +.. note:: + + Default configuration files vary by distribution. You might need + to add these sections and options rather than modifying existing + sections and options. Also, an ellipsis (``...``) in the configuration + snippets indicates potential default configuration options that you + should retain. + +This section applies to Ubuntu 14.04 (LTS) and Debian. + +#. Obtain the ``/etc/swift/swift.conf`` file from the Object + Storage source repository: + + .. code-block:: console + + # curl -o /etc/swift/swift.conf \ + https://opendev.org/openstack/swift/raw/branch/master/etc/swift.conf-sample + +#. Edit the ``/etc/swift/swift.conf`` file and complete the following + actions: + + * In the ``[swift-hash]`` section, configure the hash path prefix and + suffix for your environment. + + .. code-block:: none + + [swift-hash] + ... + swift_hash_path_suffix = HASH_PATH_SUFFIX + swift_hash_path_prefix = HASH_PATH_PREFIX + + Replace HASH_PATH_PREFIX and HASH_PATH_SUFFIX with unique values. + + .. warning:: + + Keep these values secret and do not change or lose them. + + * In the ``[storage-policy:0]`` section, configure the default + storage policy: + + .. code-block:: none + + [storage-policy:0] + ... + name = Policy-0 + default = yes + +#. Copy the ``swift.conf`` file to the ``/etc/swift`` directory on + each storage node and any additional nodes running the proxy service. + +4. On all nodes, ensure proper ownership of the configuration directory: + + .. code-block:: console + + # chown -R root:swift /etc/swift + +5. On the controller node and any other nodes running the proxy service, + restart the Object Storage proxy service including its dependencies: + + .. code-block:: console + + # service memcached restart + # service swift-proxy restart + +6. On the storage nodes, start the Object Storage services: + + .. code-block:: console + + # swift-init all start + + .. note:: + + The storage node runs many Object Storage services and the + :command:`swift-init` command makes them easier to manage. 
+ You can ignore errors from services not running on the storage node. diff --git a/doc/source/install/finalize-installation.rst b/doc/source/install/finalize-installation.rst new file mode 100644 index 0000000000..447198bcae --- /dev/null +++ b/doc/source/install/finalize-installation.rst @@ -0,0 +1,12 @@ +.. _finalize: + +Finalize installation +~~~~~~~~~~~~~~~~~~~~~ + +Finalizing installation varies by distribution. + +.. toctree:: + :maxdepth: 1 + + finalize-installation-rdo.rst + finalize-installation-ubuntu-debian.rst diff --git a/doc/source/install/get_started.rst b/doc/source/install/get_started.rst new file mode 100644 index 0000000000..1cf963010f --- /dev/null +++ b/doc/source/install/get_started.rst @@ -0,0 +1,51 @@ +=============================== +Object Storage service overview +=============================== + +The OpenStack Object Storage is a multi-tenant object storage system. It +is highly scalable and can manage large amounts of unstructured data at +low cost through a RESTful HTTP API. + +It includes the following components: + +Proxy servers (swift-proxy-server) + Accepts OpenStack Object Storage API and raw HTTP requests to upload + files, modify metadata, and create containers. It also serves file + or container listings to web browsers. To improve performance, the + proxy server can use an optional cache that is usually deployed with + memcache. + +Account servers (swift-account-server) + Manages accounts defined with Object Storage. + +Container servers (swift-container-server) + Manages the mapping of containers or folders, within Object Storage. + +Object servers (swift-object-server) + Manages actual objects, such as files, on the storage nodes. + +Various periodic processes + Performs housekeeping tasks on the large data store. The replication + services ensure consistency and availability through the cluster. + Other periodic processes include auditors, updaters, and reapers. + +WSGI middleware + Handles authentication and is usually OpenStack Identity. + +swift client + Enables users to submit commands to the REST API through a + command-line client authorized as either a admin user, reseller + user, or swift user. + +swift-init + Script that initializes the building of the ring file, takes daemon + names as parameter and offers commands. Documented in + https://docs.openstack.org/swift/latest/admin_guide.html#managing-services. + +swift-recon + A cli tool used to retrieve various metrics and telemetry information + about a cluster that has been collected by the swift-recon middleware. + +swift-ring-builder + Storage ring build and rebalance utility. Documented in + https://docs.openstack.org/swift/latest/admin_guide.html#managing-the-rings. diff --git a/doc/source/install/index.rst b/doc/source/install/index.rst new file mode 100644 index 0000000000..62d062356e --- /dev/null +++ b/doc/source/install/index.rst @@ -0,0 +1,24 @@ +============================ +Object Storage Install Guide +============================ + +.. toctree:: + :maxdepth: 2 + + get_started.rst + environment-networking.rst + controller-install.rst + storage-install.rst + initial-rings.rst + finalize-installation.rst + verify.rst + next-steps.rst + +The Object Storage services (swift) work together to provide +object storage and retrieval through a REST API. + +This chapter assumes a working setup of OpenStack following the +`OpenStack Installation Tutorial `_. + +Your environment must at least include the Identity service (keystone) +prior to deploying Object Storage. 
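Once the services in this chapter are installed and the rings are built, the same REST API that the ``swift`` command-line client wraps can also be exercised from Python. The sketch below is an illustration only and not part of the official installation steps; it assumes the ``python3-swiftclient`` package installed earlier alongside the proxy packages, the Identity endpoint ``http://controller:5000`` used throughout this guide, and placeholder ``demo`` project credentials (``DEMO_PASS`` is hypothetical).

.. code-block:: python

   from swiftclient.client import Connection

   # Authenticate against the Identity service (v3) and obtain a Swift
   # connection. All credential values below are placeholders.
   conn = Connection(
       authurl='http://controller:5000/v3',
       user='demo',
       key='DEMO_PASS',
       os_options={
           'project_name': 'demo',
           'project_domain_name': 'Default',
           'user_domain_name': 'Default',
       },
       auth_version='3')

   conn.put_container('container1')                     # create a container
   conn.put_object('container1', 'hello.txt',
                   contents=b'Hello, Object Storage!')  # upload an object
   headers, body = conn.get_object('container1', 'hello.txt')
   print(body.decode())                                 # Hello, Object Storage!

The ``openstack container create`` and ``openstack object create`` commands used in the verification section later in this guide perform the equivalent operations from the shell.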
diff --git a/doc/source/install/initial-rings.rst b/doc/source/install/initial-rings.rst new file mode 100644 index 0000000000..e09dfd4ed2 --- /dev/null +++ b/doc/source/install/initial-rings.rst @@ -0,0 +1,253 @@ +Create and distribute initial rings +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +Before starting the Object Storage services, you must create the initial +account, container, and object rings. The ring builder creates configuration +files that each node uses to determine and deploy the storage architecture. +For simplicity, this guide uses one region and two zones with 2^10 (1024) +maximum partitions, 3 replicas of each object, and 1 hour minimum time between +moving a partition more than once. For Object Storage, a partition indicates a +directory on a storage device rather than a conventional partition table. +For more information, see the +`Deployment Guide `__. + +.. note:: + Perform these steps on the controller node. + +Create account ring +------------------- + +The account server uses the account ring to maintain lists of containers. + +#. Change to the ``/etc/swift`` directory. + +#. Create the base ``account.builder`` file: + + .. code-block:: console + + # swift-ring-builder account.builder create 10 3 1 + + .. note:: + + This command provides no output. + +#. Add each storage node to the ring: + + .. code-block:: console + + # swift-ring-builder account.builder \ + add --region 1 --zone 1 --ip STORAGE_NODE_MANAGEMENT_INTERFACE_IP_ADDRESS --port 6202 \ + --device DEVICE_NAME --weight DEVICE_WEIGHT + + Replace ``STORAGE_NODE_MANAGEMENT_INTERFACE_IP_ADDRESS`` with the IP address + of the management network on the storage node. Replace ``DEVICE_NAME`` with a + storage device name on the same storage node. For example, using the first + storage node in :ref:`storage` with the ``/dev/sdb`` storage + device and weight of 100: + + .. code-block:: console + + # swift-ring-builder account.builder add \ + --region 1 --zone 1 --ip 10.0.0.51 --port 6202 --device sdb --weight 100 + + Repeat this command for each storage device on each storage node. In the + example architecture, use the command in four variations: + + .. code-block:: console + + # swift-ring-builder account.builder add \ + --region 1 --zone 1 --ip 10.0.0.51 --port 6202 --device sdb --weight 100 + Device d0r1z1-10.0.0.51:6202R10.0.0.51:6202/sdb_"" with 100.0 weight got id 0 + # swift-ring-builder account.builder add \ + --region 1 --zone 1 --ip 10.0.0.51 --port 6202 --device sdc --weight 100 + Device d1r1z2-10.0.0.51:6202R10.0.0.51:6202/sdc_"" with 100.0 weight got id 1 + # swift-ring-builder account.builder add \ + --region 1 --zone 2 --ip 10.0.0.52 --port 6202 --device sdb --weight 100 + Device d2r1z3-10.0.0.52:6202R10.0.0.52:6202/sdb_"" with 100.0 weight got id 2 + # swift-ring-builder account.builder add \ + --region 1 --zone 2 --ip 10.0.0.52 --port 6202 --device sdc --weight 100 + Device d3r1z4-10.0.0.52:6202R10.0.0.52:6202/sdc_"" with 100.0 weight got id 3 + +#. Verify the ring contents: + + .. 
code-block:: console + + # swift-ring-builder account.builder + account.builder, build version 4 + 1024 partitions, 3.000000 replicas, 1 regions, 2 zones, 4 devices, 100.00 balance, 0.00 dispersion + The minimum number of hours before a partition can be reassigned is 1 + The overload factor is 0.00% (0.000000) + Devices: id region zone ip address port replication ip replication port name weight partitions balance meta + 0 1 1 10.0.0.51 6202 10.0.0.51 6202 sdb 100.00 0 -100.00 + 1 1 1 10.0.0.51 6202 10.0.0.51 6202 sdc 100.00 0 -100.00 + 2 1 2 10.0.0.52 6202 10.0.0.52 6202 sdb 100.00 0 -100.00 + 3 1 2 10.0.0.52 6202 10.0.0.52 6202 sdc 100.00 0 -100.00 + +#. Rebalance the ring: + + .. code-block:: console + + # swift-ring-builder account.builder rebalance + Reassigned 1024 (100.00%) partitions. Balance is now 0.00. Dispersion is now 0.00 + +Create container ring +--------------------- + +The container server uses the container ring to maintain lists of objects. +However, it does not track object locations. + +#. Change to the ``/etc/swift`` directory. + +#. Create the base ``container.builder`` file: + + .. code-block:: console + + # swift-ring-builder container.builder create 10 3 1 + + .. note:: + + This command provides no output. + +#. Add each storage node to the ring: + + .. code-block:: console + + # swift-ring-builder container.builder \ + add --region 1 --zone 1 --ip STORAGE_NODE_MANAGEMENT_INTERFACE_IP_ADDRESS --port 6201 \ + --device DEVICE_NAME --weight DEVICE_WEIGHT + + Replace ``STORAGE_NODE_MANAGEMENT_INTERFACE_IP_ADDRESS`` with the IP address + of the management network on the storage node. Replace ``DEVICE_NAME`` with a + storage device name on the same storage node. For example, using the first + storage node in :ref:`storage` with the ``/dev/sdb`` + storage device and weight of 100: + + .. code-block:: console + + # swift-ring-builder container.builder add \ + --region 1 --zone 1 --ip 10.0.0.51 --port 6201 --device sdb --weight 100 + + Repeat this command for each storage device on each storage node. In the + example architecture, use the command in four variations: + + .. code-block:: console + + # swift-ring-builder container.builder add \ + --region 1 --zone 1 --ip 10.0.0.51 --port 6201 --device sdb --weight 100 + Device d0r1z1-10.0.0.51:6201R10.0.0.51:6201/sdb_"" with 100.0 weight got id 0 + # swift-ring-builder container.builder add \ + --region 1 --zone 1 --ip 10.0.0.51 --port 6201 --device sdc --weight 100 + Device d1r1z2-10.0.0.51:6201R10.0.0.51:6201/sdc_"" with 100.0 weight got id 1 + # swift-ring-builder container.builder add \ + --region 1 --zone 2 --ip 10.0.0.52 --port 6201 --device sdb --weight 100 + Device d2r1z3-10.0.0.52:6201R10.0.0.52:6201/sdb_"" with 100.0 weight got id 2 + # swift-ring-builder container.builder add \ + --region 1 --zone 2 --ip 10.0.0.52 --port 6201 --device sdc --weight 100 + Device d3r1z4-10.0.0.52:6201R10.0.0.52:6201/sdc_"" with 100.0 weight got id 3 + +#. Verify the ring contents: + + .. 
code-block:: console + + # swift-ring-builder container.builder + container.builder, build version 4 + 1024 partitions, 3.000000 replicas, 1 regions, 2 zones, 4 devices, 100.00 balance, 0.00 dispersion + The minimum number of hours before a partition can be reassigned is 1 + The overload factor is 0.00% (0.000000) + Devices: id region zone ip address port replication ip replication port name weight partitions balance meta + 0 1 1 10.0.0.51 6201 10.0.0.51 6201 sdb 100.00 0 -100.00 + 1 1 1 10.0.0.51 6201 10.0.0.51 6201 sdc 100.00 0 -100.00 + 2 1 2 10.0.0.52 6201 10.0.0.52 6201 sdb 100.00 0 -100.00 + 3 1 2 10.0.0.52 6201 10.0.0.52 6201 sdc 100.00 0 -100.00 + +#. Rebalance the ring: + + .. code-block:: console + + # swift-ring-builder container.builder rebalance + Reassigned 1024 (100.00%) partitions. Balance is now 0.00. Dispersion is now 0.00 + +Create object ring +------------------ + +The object server uses the object ring to maintain lists of object locations +on local devices. + +#. Change to the ``/etc/swift`` directory. + +#. Create the base ``object.builder`` file: + + .. code-block:: console + + # swift-ring-builder object.builder create 10 3 1 + + .. note:: + + This command provides no output. + +#. Add each storage node to the ring: + + .. code-block:: console + + # swift-ring-builder object.builder \ + add --region 1 --zone 1 --ip STORAGE_NODE_MANAGEMENT_INTERFACE_IP_ADDRESS --port 6200 \ + --device DEVICE_NAME --weight DEVICE_WEIGHT + + Replace ``STORAGE_NODE_MANAGEMENT_INTERFACE_IP_ADDRESS`` with the IP address + of the management network on the storage node. Replace ``DEVICE_NAME`` with + a storage device name on the same storage node. For example, using the first + storage node in :ref:`storage` with the ``/dev/sdb`` storage + device and weight of 100: + + .. code-block:: console + + # swift-ring-builder object.builder add \ + --region 1 --zone 1 --ip 10.0.0.51 --port 6200 --device sdb --weight 100 + + Repeat this command for each storage device on each storage node. In the + example architecture, use the command in four variations: + + .. code-block:: console + + # swift-ring-builder object.builder add \ + --region 1 --zone 1 --ip 10.0.0.51 --port 6200 --device sdb --weight 100 + Device d0r1z1-10.0.0.51:6200R10.0.0.51:6200/sdb_"" with 100.0 weight got id 0 + # swift-ring-builder object.builder add \ + --region 1 --zone 1 --ip 10.0.0.51 --port 6200 --device sdc --weight 100 + Device d1r1z2-10.0.0.51:6200R10.0.0.51:6200/sdc_"" with 100.0 weight got id 1 + # swift-ring-builder object.builder add \ + --region 1 --zone 2 --ip 10.0.0.52 --port 6200 --device sdb --weight 100 + Device d2r1z3-10.0.0.52:6200R10.0.0.52:6200/sdb_"" with 100.0 weight got id 2 + # swift-ring-builder object.builder add \ + --region 1 --zone 2 --ip 10.0.0.52 --port 6200 --device sdc --weight 100 + Device d3r1z4-10.0.0.52:6200R10.0.0.52:6200/sdc_"" with 100.0 weight got id 3 + +#. Verify the ring contents: + + .. 
code-block:: console + + # swift-ring-builder object.builder + object.builder, build version 4 + 1024 partitions, 3.000000 replicas, 1 regions, 2 zones, 4 devices, 100.00 balance, 0.00 dispersion + The minimum number of hours before a partition can be reassigned is 1 + The overload factor is 0.00% (0.000000) + Devices: id region zone ip address port replication ip replication port name weight partitions balance meta + 0 1 1 10.0.0.51 6200 10.0.0.51 6200 sdb 100.00 0 -100.00 + 1 1 1 10.0.0.51 6200 10.0.0.51 6200 sdc 100.00 0 -100.00 + 2 1 2 10.0.0.52 6200 10.0.0.52 6200 sdb 100.00 0 -100.00 + 3 1 2 10.0.0.52 6200 10.0.0.52 6200 sdc 100.00 0 -100.00 + +#. Rebalance the ring: + + .. code-block:: console + + # swift-ring-builder object.builder rebalance + Reassigned 1024 (100.00%) partitions. Balance is now 0.00. Dispersion is now 0.00 + +Distribute ring configuration files +----------------------------------- + +* Copy the ``account.ring.gz``, ``container.ring.gz``, and + ``object.ring.gz`` files to the ``/etc/swift`` directory + on each storage node and any additional nodes running the + proxy service. diff --git a/doc/source/install/next-steps.rst b/doc/source/install/next-steps.rst new file mode 100644 index 0000000000..27585ff818 --- /dev/null +++ b/doc/source/install/next-steps.rst @@ -0,0 +1,10 @@ +.. _next-steps: + +========== +Next steps +========== + +Your OpenStack environment now includes Object Storage. + +To add more services, see the +`additional documentation on installing OpenStack `_ . diff --git a/doc/source/install/storage-include1.txt b/doc/source/install/storage-include1.txt new file mode 100644 index 0000000000..711782300a --- /dev/null +++ b/doc/source/install/storage-include1.txt @@ -0,0 +1,41 @@ +Edit the ``/etc/swift/account-server.conf`` file and complete the +following actions: + +* In the ``[DEFAULT]`` section, configure the bind IP address, bind port, + user, configuration directory, and mount point directory: + + .. code-block:: none + + [DEFAULT] + ... + bind_ip = MANAGEMENT_INTERFACE_IP_ADDRESS + bind_port = 6202 + user = swift + swift_dir = /etc/swift + devices = /srv/node + mount_check = True + + Replace ``MANAGEMENT_INTERFACE_IP_ADDRESS`` with the IP address of the + management network on the storage node. + +* In the ``[pipeline:main]`` section, enable the appropriate modules: + + .. code-block:: none + + [pipeline:main] + pipeline = healthcheck recon account-server + + .. note:: + + For more information on other modules that enable additional features, + see the `Deployment Guide `__. + +* In the ``[filter:recon]`` section, configure the recon (meters) cache + directory: + + .. code-block:: none + + [filter:recon] + use = egg:swift#recon + ... + recon_cache_path = /var/cache/swift diff --git a/doc/source/install/storage-include2.txt b/doc/source/install/storage-include2.txt new file mode 100644 index 0000000000..cb320d9a1b --- /dev/null +++ b/doc/source/install/storage-include2.txt @@ -0,0 +1,41 @@ +Edit the ``/etc/swift/container-server.conf`` file and complete the +following actions: + +* In the ``[DEFAULT]`` section, configure the bind IP address, bind port, + user, configuration directory, and mount point directory: + + .. code-block:: none + + [DEFAULT] + ... + bind_ip = MANAGEMENT_INTERFACE_IP_ADDRESS + bind_port = 6201 + user = swift + swift_dir = /etc/swift + devices = /srv/node + mount_check = True + + Replace ``MANAGEMENT_INTERFACE_IP_ADDRESS`` with the IP address of the + management network on the storage node. 
+ +* In the ``[pipeline:main]`` section, enable the appropriate modules: + + .. code-block:: none + + [pipeline:main] + pipeline = healthcheck recon container-server + + .. note:: + + For more information on other modules that enable additional features, + see the `Deployment Guide `__. + +* In the ``[filter:recon]`` section, configure the recon (meters) cache + directory: + + .. code-block:: none + + [filter:recon] + use = egg:swift#recon + ... + recon_cache_path = /var/cache/swift diff --git a/doc/source/install/storage-include3.txt b/doc/source/install/storage-include3.txt new file mode 100644 index 0000000000..2cc9e2d235 --- /dev/null +++ b/doc/source/install/storage-include3.txt @@ -0,0 +1,42 @@ +Edit the ``/etc/swift/object-server.conf`` file and complete the +following actions: + +* In the ``[DEFAULT]`` section, configure the bind IP address, bind port, + user, configuration directory, and mount point directory: + + .. code-block:: none + + [DEFAULT] + ... + bind_ip = MANAGEMENT_INTERFACE_IP_ADDRESS + bind_port = 6200 + user = swift + swift_dir = /etc/swift + devices = /srv/node + mount_check = True + + Replace ``MANAGEMENT_INTERFACE_IP_ADDRESS`` with the IP address of the + management network on the storage node. + +* In the ``[pipeline:main]`` section, enable the appropriate modules: + + .. code-block:: none + + [pipeline:main] + pipeline = healthcheck recon object-server + + .. note:: + + For more information on other modules that enable additional features, + see the `Deployment Guide `__. + +* In the ``[filter:recon]`` section, configure the recon (meters) cache + and lock directories: + + .. code-block:: none + + [filter:recon] + use = egg:swift#recon + ... + recon_cache_path = /var/cache/swift + recon_lock_path = /var/lock diff --git a/doc/source/install/storage-install-rdo.rst b/doc/source/install/storage-install-rdo.rst new file mode 100644 index 0000000000..c032d8e35c --- /dev/null +++ b/doc/source/install/storage-install-rdo.rst @@ -0,0 +1,172 @@ +.. _storage-rdo: + +Install and configure the storage nodes for Red Hat Enterprise Linux and CentOS +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +This section describes how to install and configure storage nodes +that operate the account, container, and object services. For +simplicity, this configuration references two storage nodes, each +containing two empty local block storage devices. The instructions +use ``/dev/sdb`` and ``/dev/sdc``, but you can substitute different +values for your particular nodes. + +Although Object Storage supports any file system with +extended attributes (xattr), testing and benchmarking +indicate the best performance and reliability on XFS. For +more information on horizontally scaling your environment, see the +`Deployment Guide `_. + +This section applies to Red Hat Enterprise Linux 9 and CentOS stream9. + +Prerequisites +------------- + +Before you install and configure the Object Storage service on the +storage nodes, you must prepare the storage devices. + +.. note:: + + Perform these steps on each storage node. + +#. Install the supporting utility packages: + + .. code-block:: console + + # dnf install xfsprogs rsync + +#. Format the ``/dev/sdb`` and ``/dev/sdc`` devices as XFS: + + .. code-block:: console + + # mkfs.xfs /dev/sdb + # mkfs.xfs /dev/sdc + +#. Create the mount point directory structure: + + .. code-block:: console + + # mkdir -p /srv/node/sdb + # mkdir -p /srv/node/sdc + +#. Find the UUID of the new partitions: + + .. 
code-block:: console + + # blkid + +#. Edit the ``/etc/fstab`` file and add the following to it: + + .. code-block:: none + + UUID="" /srv/node/sdb xfs noatime 0 2 + UUID="" /srv/node/sdc xfs noatime 0 2 + +#. Mount the devices: + + .. code-block:: console + + # mount /srv/node/sdb + # mount /srv/node/sdc + +#. Create or edit the ``/etc/rsyncd.conf`` file to contain the following: + + .. code-block:: none + + uid = swift + gid = swift + log file = /var/log/rsyncd.log + pid file = /var/run/rsyncd.pid + address = MANAGEMENT_INTERFACE_IP_ADDRESS + + [account] + max connections = 2 + path = /srv/node/ + read only = False + lock file = /var/lock/account.lock + + [container] + max connections = 2 + path = /srv/node/ + read only = False + lock file = /var/lock/container.lock + + [object] + max connections = 2 + path = /srv/node/ + read only = False + lock file = /var/lock/object.lock + + Replace ``MANAGEMENT_INTERFACE_IP_ADDRESS`` with the IP address of the + management network on the storage node. + + .. note:: + + The ``rsync`` service requires no authentication, so consider running + it on a private network in production environments. + +7. Start the ``rsyncd`` service and configure it to start when the + system boots: + + .. code-block:: console + + # systemctl enable rsyncd.service + # systemctl start rsyncd.service + +Install and configure components +-------------------------------- + +.. note:: + + Default configuration files vary by distribution. You might need + to add these sections and options rather than modifying existing + sections and options. Also, an ellipsis (``...``) in the configuration + snippets indicates potential default configuration options that you + should retain. + +.. note:: + + Perform these steps on each storage node. + +#. Install the packages: + + .. code-block:: console + + # dnf install openstack-swift-account openstack-swift-container \ + openstack-swift-object + +2. Obtain the accounting, container, and object service configuration + files from the Object Storage source repository: + + .. code-block:: console + + # curl -o /etc/swift/account-server.conf https://opendev.org/openstack/swift/raw/branch/master/etc/account-server.conf-sample + # curl -o /etc/swift/container-server.conf https://opendev.org/openstack/swift/raw/branch/master/etc/container-server.conf-sample + # curl -o /etc/swift/object-server.conf https://opendev.org/openstack/swift/raw/branch/master/etc/object-server.conf-sample + +3. .. include:: storage-include1.txt +4. .. include:: storage-include2.txt +5. .. include:: storage-include3.txt +6. Ensure proper ownership of the mount point directory structure: + + .. code-block:: console + + # chown -R swift:swift /srv/node + +7. Create the ``recon`` directory and ensure proper ownership of it: + + .. code-block:: console + + # mkdir -p /var/cache/swift + # chown -R root:swift /var/cache/swift + # chmod -R 775 /var/cache/swift + +8. Enable necessary access in the firewall + + .. code-block:: console + + # firewall-cmd --permanent --add-port=6200/tcp + # firewall-cmd --permanent --add-port=6201/tcp + # firewall-cmd --permanent --add-port=6202/tcp + + The rsync service includes its own firewall configuration. + Connect from one node to another to ensure that access is allowed. diff --git a/doc/source/install/storage-install-ubuntu-debian.rst b/doc/source/install/storage-install-ubuntu-debian.rst new file mode 100644 index 0000000000..2464844370 --- /dev/null +++ b/doc/source/install/storage-install-ubuntu-debian.rst @@ -0,0 +1,165 @@ +.. 
_storage-ubuntu-debian: + +Install and configure the storage nodes for Ubuntu and Debian +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +This section describes how to install and configure storage nodes +that operate the account, container, and object services. For +simplicity, this configuration references two storage nodes, each +containing two empty local block storage devices. The instructions +use ``/dev/sdb`` and ``/dev/sdc``, but you can substitute different +values for your particular nodes. + +Although Object Storage supports any file system with +extended attributes (xattr), testing and benchmarking +indicate the best performance and reliability on XFS. For +more information on horizontally scaling your environment, see the +`Deployment Guide `_. + +This section applies to Ubuntu 14.04 (LTS) and Debian. + +Prerequisites +------------- + +Before you install and configure the Object Storage service on the +storage nodes, you must prepare the storage devices. + +.. note:: + + Perform these steps on each storage node. + +#. Install the supporting utility packages: + + .. code-block:: console + + # apt-get install xfsprogs rsync + +#. Format the ``/dev/sdb`` and ``/dev/sdc`` devices as XFS: + + .. code-block:: console + + # mkfs.xfs /dev/sdb + # mkfs.xfs /dev/sdc + +#. Create the mount point directory structure: + + .. code-block:: console + + # mkdir -p /srv/node/sdb + # mkdir -p /srv/node/sdc + +#. Find the UUID of the new partitions: + + .. code-block:: console + + # blkid + +#. Edit the ``/etc/fstab`` file and add the following to it: + + .. code-block:: none + + UUID="" /srv/node/sdb xfs noatime 0 2 + UUID="" /srv/node/sdc xfs noatime 0 2 + +#. Mount the devices: + + .. code-block:: console + + # mount /srv/node/sdb + # mount /srv/node/sdc + +#. Create or edit the ``/etc/rsyncd.conf`` file to contain the following: + + .. code-block:: none + + uid = swift + gid = swift + log file = /var/log/rsyncd.log + pid file = /var/run/rsyncd.pid + address = MANAGEMENT_INTERFACE_IP_ADDRESS + + [account] + max connections = 2 + path = /srv/node/ + read only = False + lock file = /var/lock/account.lock + + [container] + max connections = 2 + path = /srv/node/ + read only = False + lock file = /var/lock/container.lock + + [object] + max connections = 2 + path = /srv/node/ + read only = False + lock file = /var/lock/object.lock + + Replace ``MANAGEMENT_INTERFACE_IP_ADDRESS`` with the IP address of the + management network on the storage node. + + .. note:: + + The ``rsync`` service requires no authentication, so consider running + it on a private network in production environments. + +7. Edit the ``/etc/default/rsync`` file and enable the ``rsync`` + service: + + .. code-block:: none + + RSYNC_ENABLE=true + +8. Start the ``rsync`` service: + + .. code-block:: console + + # service rsync start + +Install and configure components +-------------------------------- + +.. note:: + + Default configuration files vary by distribution. You might need + to add these sections and options rather than modifying existing + sections and options. Also, an ellipsis (``...``) in the configuration + snippets indicates potential default configuration options that you + should retain. + +.. note:: + + Perform these steps on each storage node. + +#. Install the packages: + + .. code-block:: console + + # apt-get install swift swift-account swift-container swift-object + +2. Obtain the accounting, container, and object service configuration + files from the Object Storage source repository: + + .. 
code-block:: console + + # curl -o /etc/swift/account-server.conf https://opendev.org/openstack/swift/raw/branch/master/etc/account-server.conf-sample + # curl -o /etc/swift/container-server.conf https://opendev.org/openstack/swift/raw/branch/master/etc/container-server.conf-sample + # curl -o /etc/swift/object-server.conf https://opendev.org/openstack/swift/raw/branch/master/etc/object-server.conf-sample + +3. .. include:: storage-include1.txt +4. .. include:: storage-include2.txt +5. .. include:: storage-include3.txt +6. Ensure proper ownership of the mount point directory structure: + + .. code-block:: console + + # chown -R swift:swift /srv/node + +7. Create the ``recon`` directory and ensure proper ownership of it: + + .. code-block:: console + + # mkdir -p /var/cache/swift + # chown -R root:swift /var/cache/swift + # chmod -R 775 /var/cache/swift diff --git a/doc/source/install/storage-install.rst b/doc/source/install/storage-install.rst new file mode 100644 index 0000000000..7c1d4f9169 --- /dev/null +++ b/doc/source/install/storage-install.rst @@ -0,0 +1,15 @@ +.. _storage: + +Install and configure the storage nodes +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +This section describes how to install and configure storage nodes +that operate the account, container, and object services. + +Note that installation and configuration vary by distribution. + +.. toctree:: + :maxdepth: 1 + + storage-install-rdo.rst + storage-install-ubuntu-debian.rst diff --git a/doc/source/install/verify.rst b/doc/source/install/verify.rst new file mode 100644 index 0000000000..2580cdd7cd --- /dev/null +++ b/doc/source/install/verify.rst @@ -0,0 +1,94 @@ +.. _verify: + +Verify operation +~~~~~~~~~~~~~~~~ + +Verify operation of the Object Storage service. + +.. note:: + + Perform these steps on the controller node. + +.. warning:: + + If you are using Red Hat Enterprise Linux 7 or CentOS 7 and one or more of + these steps do not work, check the ``/var/log/audit/audit.log`` file for + SELinux messages indicating denial of actions for the ``swift`` processes. + If present, change the security context of the ``/srv/node`` directory to + the lowest security level (s0) for the ``swift_data_t`` type, ``object_r`` + role and the ``system_u`` user: + + .. code-block:: console + + # chcon -R system_u:object_r:swift_data_t:s0 /srv/node + +#. Source the ``demo`` credentials: + + .. code-block:: console + + $ . demo-openrc + +#. Show the service status: + + .. code-block:: console + + $ swift stat + Account: AUTH_ed0b60bf607743088218b0a533d5943f + Containers: 0 + Objects: 0 + Bytes: 0 + X-Account-Project-Domain-Id: default + X-Timestamp: 1444143887.71539 + X-Trans-Id: tx1396aeaf17254e94beb34-0056143bde + X-Openstack-Request-Id: tx1396aeaf17254e94beb34-0056143bde + Content-Type: text/plain; charset=utf-8 + Accept-Ranges: bytes + +#. Create ``container1`` container: + + .. code-block:: console + + $ openstack container create container1 + +---------------------------------------+------------+------------------------------------+ + | account | container | x-trans-id | + +---------------------------------------+------------+------------------------------------+ + | AUTH_ed0b60bf607743088218b0a533d5943f | container1 | tx8c4034dc306c44dd8cd68-0056f00a4a | + +---------------------------------------+------------+------------------------------------+ + +#. Upload a test file to the ``container1`` container: + + .. 
code-block:: console + + $ openstack object create container1 FILE + +--------+------------+----------------------------------+ + | object | container | etag | + +--------+------------+----------------------------------+ + | FILE | container1 | ee1eca47dc88f4879d8a229cc70a07c6 | + +--------+------------+----------------------------------+ + + Replace ``FILE`` with the name of a local file to upload to the + ``container1`` container. + +#. List files in the ``container1`` container: + + .. code-block:: console + + $ openstack object list container1 + +------+ + | Name | + +------+ + | FILE | + +------+ + +#. Download a test file from the ``container1`` container: + + .. code-block:: console + + $ openstack object save container1 FILE + + Replace ``FILE`` with the name of the file uploaded to the + ``container1`` container. + + .. note:: + + This command provides no output. diff --git a/doc/source/logs.rst b/doc/source/logs.rst new file mode 100644 index 0000000000..16bc6f0da7 --- /dev/null +++ b/doc/source/logs.rst @@ -0,0 +1,198 @@ +==== +Logs +==== + +Swift has quite verbose logging, and the generated logs can be used for +cluster monitoring, utilization calculations, audit records, and more. As an +overview, Swift's logs are sent to syslog and organized by log level and +syslog facility. All log lines related to the same request have the same +transaction id. This page documents the log formats used in the system. + +.. note:: + + By default, Swift will log full log lines. However, with the + ``log_max_line_length`` setting and depending on your logging server + software, lines may be truncated or shortened. With ``log_max_line_length < + 7``, the log line will be truncated. With ``log_max_line_length >= 7``, the + log line will be "shortened": about half the max length followed by " ... " + followed by the other half the max length. Unless you use exceptionally + short values, you are unlikely to run across this with the following + documented log lines, but you may see it with debugging and error log + lines. + +---------- +Proxy Logs +---------- + +The proxy logs contain the record of all external API requests made to the +proxy server. Swift's proxy servers log requests using a custom format +designed to provide robust information and simple processing. It is possible +to change this format with the ``log_msg_template`` config parameter. +The default log format is:: + + {client_ip} {remote_addr} {end_time.datetime} {method} {path} {protocol} + {status_int} {referer} {user_agent} {auth_token} {bytes_recvd} + {bytes_sent} {client_etag} {transaction_id} {headers} {request_time} + {source} {log_info} {start_time} {end_time} {policy_index} + {access_user_id} + +Some keywords, signaled by the (anonymizable) flag, can be anonymized by +using the transformer 'anonymized'. The data are applied the hashing method of +``log_anonymization_method`` and an optional salt ``log_anonymization_salt``. + +Some keywords, signaled by the (timestamp) flag, can be converted to standard +dates formats using the matching transformers: 'datetime', 'asctime' or +'iso8601'. Other transformers for timestamps are 's', 'ms', 'us' and 'ns' for +seconds, milliseconds, microseconds and nanoseconds. Python's strftime +directives can also be used as tranformers (a, A, b, B, c, d, H, I, j, m, M, p, +S, U, w, W, x, X, y, Y, Z). 
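The strftime-style transformers amount to applying the corresponding directive to the time carried by the raw timestamp. The following standalone sketch (an illustration only, not Swift's implementation) shows the idea:

.. code-block:: python

   import time

   end_time = 1444143887.71539        # an example high-resolution Unix timestamp
   gm = time.gmtime(end_time)         # rendered in UTC for this illustration

   # {end_time.H}:{end_time.M} -- single strftime directives, as in the
   # example template below
   print(time.strftime('%H', gm) + ':' + time.strftime('%M', gm))   # 15:04

   # {end_time.iso8601} -- roughly an ISO 8601 rendering of the same instant
   print(time.strftime('%Y-%m-%dT%H:%M:%S', gm))                    # 2015-10-06T15:04:47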
+ +Example:: + + {client_ip.anonymized} {remote_addr.anonymized} {start_time.iso8601} + {end_time.H}:{end_time.M} {method} acc:{account} cnt:{container} + obj:{object.anonymized} + +=================== ========================================================== +**Log Field** **Value** +------------------- ---------------------------------------------------------- +client_ip Swift's guess at the end-client IP, taken from various + headers in the request. (anonymizable) +remote_addr The IP address of the other end of the TCP connection. + (anonymizable) +end_time Timestamp of the request. (timestamp) +method The HTTP verb in the request. +domain The domain in the request. (anonymizable) +path The path portion of the request. (anonymizable) +protocol The transport protocol used (currently one of http or + https). +status_int The response code for the request. +referer The value of the HTTP Referer header. (anonymizable) +user_agent The value of the HTTP User-Agent header. (anonymizable) +auth_token The value of the auth token. This may be truncated or + otherwise obscured. +bytes_recvd The number of bytes read from the client for this request. +bytes_sent The number of bytes sent to the client in the body of the + response. This is how many bytes were yielded to the WSGI + server. +client_etag The etag header value given by the client. (anonymizable) +transaction_id The transaction id of the request. +headers The headers given in the request. (anonymizable) +request_time The duration of the request. +source The "source" of the request. This may be set for requests + that are generated in order to fulfill client requests, + e.g. bulk uploads. +log_info Various info that may be useful for diagnostics, e.g. the + value of any x-delete-at header. +start_time High-resolution timestamp from the start of the request. + (timestamp) +end_time High-resolution timestamp from the end of the request. + (timestamp) +ttfb Duration between the request and the first bytes is sent. +policy_index The value of the storage policy index. +account The account part extracted from the path of the request. + (anonymizable) +container The container part extracted from the path of the request. + (anonymizable) +object The object part extracted from the path of the request. + (anonymizable) +pid PID of the process emitting the log line. +wire_status_int The status sent to the client, which may be different than + the logged response code if there was an error during the + body of the request or a disconnect. +access_user_id The user ID for logging. Middlewares should set + environ['swift.access_logging']['user_id'] to identify the user + for logging purposes. For S3 API requests, this contains the S3 + access key ID. Other auth middlewares should set user-specific + identifiers. For requests without auth middleware support, this + field will be "-". +=================== ========================================================== + +In one log line, all of the above fields are space-separated and url-encoded. +If any value is empty, it will be logged as a "-". This allows for simple +parsing by splitting each line on whitespace. New values may be placed at the +end of the log line from time to time, but the order of the existing values +will not change. Swift log processing utilities should look for the first N +fields they require (e.g. in Python using something like +``log_line.split()[:14]`` to get up through the transaction id). + +.. 
note:: + + Some log fields (like the request path) are already url quoted, so the + logged value will be double-quoted. For example, if a client uploads an + object name with a ``:`` in it, it will be url-quoted as ``%3A``. The log + module will then quote this value as ``%253A``. + +Swift Source +============ + +The ``source`` value in the proxy logs is used to identify the originator of a +request in the system. For example, if the client initiates a bulk upload, the +proxy server may end up doing many requests. The initial bulk upload request +will be logged as normal, but all of the internal "child requests" will have a +source value indicating they came from the bulk functionality. + +======================= ============================= +**Logged Source Value** **Originator of the Request** +----------------------- ----------------------------- +FP :ref:`formpost` +SLO :ref:`static-large-objects` +SW :ref:`staticweb` +TU :ref:`tempurl` +BD :ref:`bulk` (delete) +EA :ref:`bulk` (extract) +AQ :ref:`account-quotas` +CQ :ref:`container-quotas` +CS :ref:`container-sync` +TA :ref:`common_tempauth` +DLO :ref:`dynamic-large-objects` +LE :ref:`list_endpoints` +KS :ref:`keystoneauth` +RL :ref:`ratelimit` +RO :ref:`read_only` +VW :ref:`versioned_writes` +SSC :ref:`copy` +SYM :ref:`symlink` +SH :ref:`sharding_doc` +S3 :ref:`s3api` +OV :ref:`object_versioning` +EQ :ref:`etag_quoter` +======================= ============================= + + +----------------- +Storage Node Logs +----------------- + +Swift's account, container, and object server processes each log requests +that they receive, if they have been configured to do so with the +``log_requests`` config parameter (which defaults to true). The format for +these log lines is:: + + remote_addr - - [datetime] "request_method request_path" status_int + content_length "referer" "transaction_id" "user_agent" request_time + additional_info server_pid policy_index + +=================== ========================================================== +**Log Field** **Value** +------------------- ---------------------------------------------------------- +remote_addr The IP address of the other end of the TCP connection. +datetime Timestamp of the request, in + "day/month/year:hour:minute:second +0000" format. +request_method The HTTP verb in the request. +request_path The path portion of the request. +status_int The response code for the request. +content_length The value of the Content-Length header in the response. +referer The value of the HTTP Referer header. +transaction_id The transaction id of the request. +user_agent The value of the HTTP User-Agent header. Swift services + report a user-agent string of the service name followed by + the process ID, such as ``"proxy-server "`` or ``"object-updater "``. +request_time The time between request received and response started. + **Note**: This includes transfer time on PUT, but not GET. +additional_info Additional useful information. +server_pid The process id of the server +policy_index The value of the storage policy index. 
+=================== ========================================================== diff --git a/doc/source/metrics/account_auditor.rst b/doc/source/metrics/account_auditor.rst new file mode 100644 index 0000000000..83fbd74408 --- /dev/null +++ b/doc/source/metrics/account_auditor.rst @@ -0,0 +1,12 @@ +``account-auditor`` Metrics +=========================== + +============================ ========================================================= +Metric Name Description +---------------------------- --------------------------------------------------------- +``account-auditor.errors`` Count of audit runs (across all account databases) which + caught an Exception. +``account-auditor.passes`` Count of individual account databases which passed audit. +``account-auditor.failures`` Count of individual account databases which failed audit. +``account-auditor.timing`` Timing data for individual account database audits. +============================ ========================================================= diff --git a/doc/source/metrics/account_reaper.rst b/doc/source/metrics/account_reaper.rst new file mode 100644 index 0000000000..a95f8b2c12 --- /dev/null +++ b/doc/source/metrics/account_reaper.rst @@ -0,0 +1,25 @@ +``account-reaper`` Metrics +========================== + +================================================ ==================================================== +Metric Name Description +------------------------------------------------ ---------------------------------------------------- +``account-reaper.errors`` Count of devices failing the mount check. +``account-reaper.timing`` Timing data for each reap_account() call. +``account-reaper.return_codes.X`` Count of HTTP return codes from various operations + (e.g. object listing, container deletion, etc.). The + value for X is the first digit of the return code + (2 for 201, 4 for 404, etc.). +``account-reaper.containers_failures`` Count of failures to delete a container. +``account-reaper.containers_deleted`` Count of containers successfully deleted. +``account-reaper.containers_remaining`` Count of containers which failed to delete with + zero successes. +``account-reaper.containers_possibly_remaining`` Count of containers which failed to delete with + at least one success. +``account-reaper.objects_failures`` Count of failures to delete an object. +``account-reaper.objects_deleted`` Count of objects successfully deleted. +``account-reaper.objects_remaining`` Count of objects which failed to delete with zero + successes. +``account-reaper.objects_possibly_remaining`` Count of objects which failed to delete with at + least one success. +================================================ ==================================================== diff --git a/doc/source/metrics/account_replicator.rst b/doc/source/metrics/account_replicator.rst new file mode 100644 index 0000000000..19127953b0 --- /dev/null +++ b/doc/source/metrics/account_replicator.rst @@ -0,0 +1,31 @@ +``account-replicator`` Metrics +============================== + +======================================= ==================================================== +Metric Name Description +--------------------------------------- ---------------------------------------------------- +``account-replicator.diffs`` Count of syncs handled by sending differing rows. +``account-replicator.diff_caps`` Count of "diffs" operations which failed because + "max_diffs" was hit. +``account-replicator.no_changes`` Count of accounts found to be in sync. 
+``account-replicator.hashmatches`` Count of accounts found to be in sync via hash + comparison (``broker.merge_syncs`` was called). +``account-replicator.rsyncs`` Count of completely missing accounts which were sent + via rsync. +``account-replicator.remote_merges`` Count of syncs handled by sending entire database + via rsync. +``account-replicator.attempts`` Count of database replication attempts. +``account-replicator.failures`` Count of database replication attempts which failed + due to corruption (quarantined) or inability to read + as well as attempts to individual nodes which + failed. +``account-replicator.removes.`` Count of databases on deleted because the + delete_timestamp was greater than the put_timestamp + and the database had no rows or because it was + successfully sync'ed to other locations and doesn't + belong here anymore. +``account-replicator.successes`` Count of replication attempts to an individual node + which were successful. +``account-replicator.timing`` Timing data for each database replication attempt + not resulting in a failure. +======================================= ==================================================== diff --git a/doc/source/metrics/account_server.rst b/doc/source/metrics/account_server.rst new file mode 100644 index 0000000000..6bf75f0558 --- /dev/null +++ b/doc/source/metrics/account_server.rst @@ -0,0 +1,37 @@ +``account-server`` Metrics +========================== + +..note:: + "Not Found" is not considered an error and requests + which increment ``errors`` are not included in the timing data. + +========================================== ======================================================= +Metric Name Description +------------------------------------------ ------------------------------------------------------- +``account-server.DELETE.errors.timing`` Timing data for each DELETE request resulting in an + error: bad request, not mounted, missing timestamp. +``account-server.DELETE.timing`` Timing data for each DELETE request not resulting in + an error. +``account-server.PUT.errors.timing`` Timing data for each PUT request resulting in an error: + bad request, not mounted, conflict, recently-deleted. +``account-server.PUT.timing`` Timing data for each PUT request not resulting in an + error. +``account-server.HEAD.errors.timing`` Timing data for each HEAD request resulting in an + error: bad request, not mounted. +``account-server.HEAD.timing`` Timing data for each HEAD request not resulting in + an error. +``account-server.GET.errors.timing`` Timing data for each GET request resulting in an + error: bad request, not mounted, bad delimiter, + account listing limit too high, bad accept header. +``account-server.GET.timing`` Timing data for each GET request not resulting in + an error. +``account-server.REPLICATE.errors.timing`` Timing data for each REPLICATE request resulting in an + error: bad request, not mounted. +``account-server.REPLICATE.timing`` Timing data for each REPLICATE request not resulting + in an error. +``account-server.POST.errors.timing`` Timing data for each POST request resulting in an + error: bad request, bad or missing timestamp, not + mounted. +``account-server.POST.timing`` Timing data for each POST request not resulting in + an error. 
+========================================== ======================================================= diff --git a/doc/source/metrics/all.rst b/doc/source/metrics/all.rst new file mode 100644 index 0000000000..bca1c10870 --- /dev/null +++ b/doc/source/metrics/all.rst @@ -0,0 +1,24 @@ +:orphan: + +All Statsd Metrics +================== + +.. include:: account_auditor.rst +.. include:: account_reaper.rst +.. include:: account_server.rst +.. include:: account_replicator.rst + +.. include:: container_auditor.rst +.. include:: container_replicator.rst +.. include:: container_server.rst +.. include:: container_sync.rst +.. include:: container_updater.rst + +.. include:: object_auditor.rst +.. include:: object_expirer.rst +.. include:: object_reconstructor.rst +.. include:: object_replicator.rst +.. include:: object_server.rst +.. include:: object_updater.rst + +.. include:: proxy_server.rst diff --git a/doc/source/metrics/container_auditor.rst b/doc/source/metrics/container_auditor.rst new file mode 100644 index 0000000000..4054337098 --- /dev/null +++ b/doc/source/metrics/container_auditor.rst @@ -0,0 +1,12 @@ +``container-auditor`` Metrics +============================= + +============================== ==================================================== +Metric Name Description +------------------------------ ---------------------------------------------------- +``container-auditor.errors`` Incremented when an Exception is caught in an audit + pass (only once per pass, max). +``container-auditor.passes`` Count of individual containers passing an audit. +``container-auditor.failures`` Count of individual containers failing an audit. +``container-auditor.timing`` Timing data for each container audit. +============================== ==================================================== diff --git a/doc/source/metrics/container_replicator.rst b/doc/source/metrics/container_replicator.rst new file mode 100644 index 0000000000..c575190638 --- /dev/null +++ b/doc/source/metrics/container_replicator.rst @@ -0,0 +1,31 @@ +``container-replicator`` Metrics +================================ + +========================================= ==================================================== +Metric Name Description +----------------------------------------- ---------------------------------------------------- +``container-replicator.diffs`` Count of syncs handled by sending differing rows. +``container-replicator.diff_caps`` Count of "diffs" operations which failed because + "max_diffs" was hit. +``container-replicator.no_changes`` Count of containers found to be in sync. +``container-replicator.hashmatches`` Count of containers found to be in sync via hash + comparison (``broker.merge_syncs`` was called). +``container-replicator.rsyncs`` Count of completely missing containers where were sent + via rsync. +``container-replicator.remote_merges`` Count of syncs handled by sending entire database + via rsync. +``container-replicator.attempts`` Count of database replication attempts. +``container-replicator.failures`` Count of database replication attempts which failed + due to corruption (quarantined) or inability to read + as well as attempts to individual nodes which + failed. +``container-replicator.removes.`` Count of databases deleted on because the + delete_timestamp was greater than the put_timestamp + and the database had no rows or because it was + successfully sync'ed to other locations and doesn't + belong here anymore. 
+``container-replicator.successes`` Count of replication attempts to an individual node + which were successful. +``container-replicator.timing`` Timing data for each database replication attempt + not resulting in a failure. +========================================= ==================================================== diff --git a/doc/source/metrics/container_server.rst b/doc/source/metrics/container_server.rst new file mode 100644 index 0000000000..a5c41daf87 --- /dev/null +++ b/doc/source/metrics/container_server.rst @@ -0,0 +1,35 @@ +``container-server`` Metrics +============================ + +.. note:: + "Not Found" is not considered an error and requests + which increment ``errors`` are not included in the timing data. + +============================================ ==================================================== +Metric Name Description +-------------------------------------------- ---------------------------------------------------- +``container-server.DELETE.errors.timing`` Timing data for DELETE request errors: bad request, + not mounted, missing timestamp, conflict. +``container-server.DELETE.timing`` Timing data for each DELETE request not resulting in + an error. +``container-server.PUT.errors.timing`` Timing data for PUT request errors: bad request, + missing timestamp, not mounted, conflict. +``container-server.PUT.timing`` Timing data for each PUT request not resulting in an + error. +``container-server.HEAD.errors.timing`` Timing data for HEAD request errors: bad request, + not mounted. +``container-server.HEAD.timing`` Timing data for each HEAD request not resulting in + an error. +``container-server.GET.errors.timing`` Timing data for GET request errors: bad request, + not mounted, parameters not utf8, bad accept header. +``container-server.GET.timing`` Timing data for each GET request not resulting in + an error. +``container-server.REPLICATE.errors.timing`` Timing data for REPLICATE request errors: bad + request, not mounted. +``container-server.REPLICATE.timing`` Timing data for each REPLICATE request not resulting + in an error. +``container-server.POST.errors.timing`` Timing data for POST request errors: bad request, + bad x-container-sync-to, not mounted. +``container-server.POST.timing`` Timing data for each POST request not resulting in + an error. +============================================ ==================================================== diff --git a/doc/source/metrics/container_sync.rst b/doc/source/metrics/container_sync.rst new file mode 100644 index 0000000000..e36a15fef1 --- /dev/null +++ b/doc/source/metrics/container_sync.rst @@ -0,0 +1,18 @@ +``container-sync`` Metrics +========================== + +================================= ==================================================== +Metric Name Description +--------------------------------- ---------------------------------------------------- +``container-sync.skips`` Count of containers skipped because they don't have + sync'ing enabled. +``container-sync.failures`` Count of failures sync'ing of individual containers. +``container-sync.syncs`` Count of individual containers sync'ed successfully. +``container-sync.deletes`` Count of container database rows sync'ed by + deletion. +``container-sync.deletes.timing`` Timing data for each container database row + synchronization via deletion. +``container-sync.puts`` Count of container database rows sync'ed by Putting. +``container-sync.puts.timing`` Timing data for each container database row + synchronization via Putting. 
+================================= ==================================================== diff --git a/doc/source/metrics/container_updater.rst b/doc/source/metrics/container_updater.rst new file mode 100644 index 0000000000..d498266f21 --- /dev/null +++ b/doc/source/metrics/container_updater.rst @@ -0,0 +1,17 @@ +``container-updater`` Metrics +============================= + +================================ ==================================================== +Metric Name Description +-------------------------------- ---------------------------------------------------- +``container-updater.successes`` Count of containers which successfully updated their + account. +``container-updater.failures`` Count of containers which failed to update their + account. +``container-updater.no_changes`` Count of containers which didn't need to update + their account. +``container-updater.timing`` Timing data for processing a container; only + includes timing for containers which needed to + update their accounts (i.e. "successes" and + "failures" but not "no_changes"). +================================ ==================================================== diff --git a/doc/source/metrics/labels.rst b/doc/source/metrics/labels.rst new file mode 100644 index 0000000000..6e85254167 --- /dev/null +++ b/doc/source/metrics/labels.rst @@ -0,0 +1,68 @@ +:orphan: + +Labeled Metrics +=============== + +.. note:: + Labeled metrics are still an experimental feature. This document contains + forward looking statements that anticipate future development of labeled + metrics support. In particular, metric names and labels may be subject to + change as we explore the space. + +.. warning:: + Enabling labeled metrics will likely cause a dramatic increase in the number + of distinct metrics time series. Ensure your metrics pipeline is prepared. + +Recent versions of Swift emit StatsD metrics with explicit application-defined +labels, rather than relying on consumers knowing how to unpack the legacy label +names. A variety of StatsD extension formats are available, many of which are +parsed by `statsd_exporter `__: + +- ``librato`` +- ``influxdb`` +- ``dogstatsd`` +- ``graphite`` + +See the ``proxy-server.conf-sample`` file for more information on configuring +labeled metrics. + +Labeled metrics are emitted in addition to legacy StatsD metrics. However, +legacy StatsD metrics can be disabled by setting the ``statsd_emit_legacy`` +option to ``False``. This is not recommended until more legacy metrics have +been supplemented with equivalent labeled metrics. + +As various Swift middlewares, services and daemons are upgraded to emit labeled +metrics, they will be documented in the relevant section of the :doc:`all` +page. + +Common Labels +------------- + +Each labeled metric may have its own unique labels, but many labeled metrics +will use some or all of a common set of labels. The common labels are +documented here for information purposes, but the authoritative set of labels +for each metric can be found in the sections of the :doc:`all` page. + +.. table:: + :align: left + + ================ ========================================================== + Label Name Value + ---------------- ---------------------------------------------------------- + ``resource`` The type of resource associated with the metric + i.e. ``account``, ``container`` or ``object``. + ``account`` The quoted account name associated with the metric. + ``container`` The quoted container name associated with the metric. 
+ ``policy`` The storage policy index associated with the metric. + ``status`` The status int of an HTTP response associated with the + metric. + ``method`` The method of an HTTP request associated with the metric. + ================ ========================================================== + + +.. note:: + Note that metrics will *not* have labels that would likely have a very high + cardinality of values, such as object names, as this is expected to be + problematic for metrics collectors. Nevertheless, some operators may still + need to drop labels such as ``container`` in order to keep metric + cardinalities reasonable. diff --git a/doc/source/metrics/object_auditor.rst b/doc/source/metrics/object_auditor.rst new file mode 100644 index 0000000000..4baa040075 --- /dev/null +++ b/doc/source/metrics/object_auditor.rst @@ -0,0 +1,13 @@ +``object-auditor`` Metrics +========================== + +============================== ==================================================== +Metric Name Description +------------------------------ ---------------------------------------------------- +``object-auditor.quarantines`` Count of objects failing audit and quarantined. +``object-auditor.errors`` Count of errors encountered while auditing objects. +``object-auditor.timing`` Timing data for each object audit (does not include + any rate-limiting sleep time for + max_files_per_second, but does include rate-limiting + sleep time for max_bytes_per_second). +============================== ==================================================== diff --git a/doc/source/metrics/object_expirer.rst b/doc/source/metrics/object_expirer.rst new file mode 100644 index 0000000000..71e725ec8f --- /dev/null +++ b/doc/source/metrics/object_expirer.rst @@ -0,0 +1,12 @@ +``object-expirer`` Metrics +========================== + +========================== ==================================================== +Metric Name Description +-------------------------- ---------------------------------------------------- +``object-expirer.objects`` Count of objects expired. +``object-expirer.errors`` Count of errors encountered while attempting to + expire an object. +``object-expirer.timing`` Timing data for each object expiration attempt, + including ones resulting in an error. +========================== ==================================================== diff --git a/doc/source/metrics/object_reconstructor.rst b/doc/source/metrics/object_reconstructor.rst new file mode 100644 index 0000000000..66ec0bec8b --- /dev/null +++ b/doc/source/metrics/object_reconstructor.rst @@ -0,0 +1,25 @@ +``object-reconstructor`` Metrics +================================ + +======================================================== ====================================================== +Metric Name Description +-------------------------------------------------------- ------------------------------------------------------ +``object-reconstructor.partition.delete.count.`` A count of partitions on which were + reconstructed and synced to another node because they + didn't belong on this node. This metric is tracked + per-device to allow for "quiescence detection" for + object reconstruction activity on each device. +``object-reconstructor.partition.delete.timing`` Timing data for partitions reconstructed and synced to + another node because they didn't belong on this node. + This metric is not tracked per device. 
+``object-reconstructor.partition.update.count.`` A count of partitions on which were + reconstructed and synced to another node, but also + belong on this node. As with delete.count, this metric + is tracked per-device. +``object-reconstructor.partition.update.timing`` Timing data for partitions reconstructed which also + belong on this node. This metric is not tracked + per-device. +``object-reconstructor.suffix.hashes`` Count of suffix directories whose hash (of filenames) + was recalculated. +``object-reconstructor.suffix.syncs`` Count of suffix directories reconstructed with ssync. +======================================================== ====================================================== diff --git a/doc/source/metrics/object_replicator.rst b/doc/source/metrics/object_replicator.rst new file mode 100644 index 0000000000..934c1c3f5a --- /dev/null +++ b/doc/source/metrics/object_replicator.rst @@ -0,0 +1,25 @@ +``object-replicator`` Metrics +============================= + +===================================================== ==================================================== +Metric Name Description +----------------------------------------------------- ---------------------------------------------------- +``object-replicator.partition.delete.count.`` A count of partitions on which were + replicated to another node because they didn't + belong on this node. This metric is tracked + per-device to allow for "quiescence detection" for + object replication activity on each device. +``object-replicator.partition.delete.timing`` Timing data for partitions replicated to another + node because they didn't belong on this node. This + metric is not tracked per device. +``object-replicator.partition.update.count.`` A count of partitions on which were + replicated to another node, but also belong on this + node. As with delete.count, this metric is tracked + per-device. +``object-replicator.partition.update.timing`` Timing data for partitions replicated which also + belong on this node. This metric is not tracked + per-device. +``object-replicator.suffix.hashes`` Count of suffix directories whose hash (of filenames) + was recalculated. +``object-replicator.suffix.syncs`` Count of suffix directories replicated with rsync. +===================================================== ==================================================== diff --git a/doc/source/metrics/object_server.rst b/doc/source/metrics/object_server.rst new file mode 100644 index 0000000000..ef4c5e07ad --- /dev/null +++ b/doc/source/metrics/object_server.rst @@ -0,0 +1,49 @@ +``object-server`` Metrics +========================= + +========================================= ==================================================== +Metric Name Description +----------------------------------------- ---------------------------------------------------- +``object-server.quarantines`` Count of objects (files) found bad and moved to + quarantine. +``object-server.async_pendings`` Count of container updates saved as async_pendings + (may result from PUT or DELETE requests). +``object-server.POST.errors.timing`` Timing data for POST request errors: bad request, + missing timestamp, delete-at in past, not mounted. +``object-server.POST.timing`` Timing data for each POST request not resulting in + an error. +``object-server.PUT.errors.timing`` Timing data for PUT request errors: bad request, + not mounted, missing timestamp, object creation + constraint violation, delete-at in past. 
+``object-server.PUT.timeouts`` Count of object PUTs which exceeded max_upload_time. +``object-server.PUT.timing`` Timing data for each PUT request not resulting in an + error. +``object-server.PUT..timing`` Timing data per kB transferred (ms/kB) for each + non-zero-byte PUT request on each device. + Monitoring problematic devices, higher is bad. +``object-server.GET.errors.timing`` Timing data for GET request errors: bad request, + not mounted, header timestamps before the epoch, + precondition failed. + File errors resulting in a quarantine are not + counted here. +``object-server.GET.timing`` Timing data for each GET request not resulting in an + error. Includes requests which couldn't find the + object (including disk errors resulting in file + quarantine). +``object-server.HEAD.errors.timing`` Timing data for HEAD request errors: bad request, + not mounted. +``object-server.HEAD.timing`` Timing data for each HEAD request not resulting in + an error. Includes requests which couldn't find the + object (including disk errors resulting in file + quarantine). +``object-server.DELETE.errors.timing`` Timing data for DELETE request errors: bad request, + missing timestamp, not mounted, precondition + failed. Includes requests which couldn't find or + match the object. +``object-server.DELETE.timing`` Timing data for each DELETE request not resulting + in an error. +``object-server.REPLICATE.errors.timing`` Timing data for REPLICATE request errors: bad + request, not mounted. +``object-server.REPLICATE.timing`` Timing data for each REPLICATE request not resulting + in an error. +========================================= ==================================================== diff --git a/doc/source/metrics/object_updater.rst b/doc/source/metrics/object_updater.rst new file mode 100644 index 0000000000..ca223e4994 --- /dev/null +++ b/doc/source/metrics/object_updater.rst @@ -0,0 +1,22 @@ +``object-updater`` Metrics +========================== + +============================== ==================================================== +Metric Name Description +------------------------------ ---------------------------------------------------- +``object-updater.errors`` Count of drives not mounted or async_pending files + with an unexpected name. +``object-updater.timing`` Timing data for object sweeps to flush async_pending + container updates. Does not include object sweeps + which did not find an existing async_pending storage + directory. +``object-updater.quarantines`` Count of async_pending container updates which were + corrupted and moved to quarantine. +``object-updater.successes`` Count of successful container updates. +``object-updater.failures`` Count of failed container updates. +``object-updater.unlinks`` Count of async_pending files unlinked. An + async_pending file is unlinked either when it is + successfully processed or when the replicator sees + that there is a newer async_pending file for the + same object. +============================== ==================================================== diff --git a/doc/source/metrics/proxy_server.rst b/doc/source/metrics/proxy_server.rst new file mode 100644 index 0000000000..3e72f426f7 --- /dev/null +++ b/doc/source/metrics/proxy_server.rst @@ -0,0 +1,113 @@ +``proxy-server`` Metrics +======================== + +In the table, ```` is the proxy-server controller responsible for the +request and will be one of ``account``, ``container``, or ``object``. 
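+
+Consumers of these legacy metrics have to know how to unpack the
+dot-delimited names themselves (see the labeled-metrics documentation
+above). As an illustration only (the helper below is hypothetical and not
+part of Swift), such a consumer might split a legacy timing metric name
+roughly as follows, assuming the naming conventions documented in the
+tables below:
+
+.. code:: python
+
+   def parse_proxy_timing_metric(name):
+       """Split e.g. 'proxy-server.object.GET.200.timing' into its parts."""
+       parts = name.split('.')
+       if (len(parts) != 5 or parts[0] != 'proxy-server'
+               or parts[-1] != 'timing'):
+           raise ValueError('not a proxy-server timing metric: %r' % name)
+       _, controller, verb, status, _ = parts
+       return {'controller': controller, 'verb': verb, 'status': int(status)}
+
+   # e.g. {'controller': 'object', 'verb': 'GET', 'status': 200}
+   print(parse_proxy_timing_metric('proxy-server.object.GET.200.timing'))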
+ +========================================== ==================================================== +Metric Name Description +------------------------------------------ ---------------------------------------------------- +``proxy-server.errors`` Count of errors encountered while serving requests + before the controller type is determined. Includes + invalid Content-Length, errors finding the internal + controller to handle the request, invalid utf8, and + bad URLs. +``proxy-server..handoff_count`` Count of node hand-offs; only tracked if log_handoffs + is set in the proxy-server config. +``proxy-server..handoff_all_count`` Count of times *only* hand-off locations were + utilized; only tracked if log_handoffs is set in the + proxy-server config. +``proxy-server..client_timeouts`` Count of client timeouts (client did not read within + ``client_timeout`` seconds during a GET or did not + supply data within ``client_timeout`` seconds during + a PUT). +``proxy-server..client_disconnects`` Count of detected client disconnects during PUT + operations (does NOT include caught Exceptions in + the proxy-server which caused a client disconnect). +========================================== ==================================================== + +Additionally, middleware often emit their own metrics + +``proxy-logging`` Middleware +---------------------------- + +In the table, ```` is either the proxy-server controller responsible +for the request: ``account``, ``container``, ``object``, or the string +``SOS`` if the request came from the `Swift Origin Server`_ middleware. +The ```` portion will be one of ``GET``, ``HEAD``, ``POST``, ``PUT``, +``DELETE``, ``COPY``, ``OPTIONS``, or ``BAD_METHOD``. The list of valid +HTTP methods is configurable via the ``log_statsd_valid_http_methods`` +config variable and the default setting yields the above behavior. + +.. _Swift Origin Server: https://github.com/dpgoetz/sos + +====================================================== ============================================ +Metric Name Description +------------------------------------------------------ -------------------------------------------- +``proxy-server....timing`` Timing data for requests, start to finish. + The portion is the numeric HTTP + status code for the request (e.g. "200" or + "404"). +``proxy-server..GET..first-byte.timing`` Timing data up to completion of sending the + response headers (only for GET requests). + and are as for the main + timing metric. +``proxy-server....xfer`` This counter metric is the sum of bytes + transferred in (from clients) and out (to + clients) for requests. The , , + and portions of the metric are just + like the main timing metric. +====================================================== ============================================ + +The ``proxy-logging`` middleware also groups these metrics by policy. The +```` portion represents a policy index: + +============================================================================ ===================================== +Metric Name Description +---------------------------------------------------------------------------- ------------------------------------- +``proxy-server.object.policy....timing`` Timing data for requests, aggregated + by policy index. +``proxy-server.object.policy..GET..first-byte.timing`` Timing data up to completion of + sending the response headers, + aggregated by policy index. +``proxy-server.object.policy....xfer`` Sum of bytes transferred in and out, + aggregated by policy index. 
+============================================================================ ===================================== + +``tempauth`` Middleware +----------------------- +In the table, ```` represents the actual configured +reseller_prefix or ``NONE`` if the reseller_prefix is the empty string: + +=========================================== ==================================================== +Metric Name Description +------------------------------------------- ---------------------------------------------------- +``tempauth..unauthorized`` Count of regular requests which were denied with + HTTPUnauthorized. +``tempauth..forbidden`` Count of regular requests which were denied with + HTTPForbidden. +``tempauth..token_denied`` Count of token requests which were denied. +``tempauth..errors`` Count of errors. +=========================================== ==================================================== + +``tempurl`` Middleware +---------------------- + +========================================== ==================================================== +Metric Name Description +------------------------------------------ ---------------------------------------------------- +``proxy-server.tempurl.digests.`` Count of requests authorized using the specified + ````; may be one of ``sha1``, ``sha256``, + or ``sha512``. +========================================== ==================================================== + +``formpost`` Middleware +----------------------- + +========================================== ==================================================== +Metric Name Description +------------------------------------------ ---------------------------------------------------- +``proxy-server.formpost.digests.`` Count of requests authorized using the specified + ````; may be one of ``sha1``, ``sha256``, + or ``sha512``. +========================================== ==================================================== diff --git a/doc/source/middleware.rst b/doc/source/middleware.rst new file mode 100644 index 0000000000..ee2e3dc674 --- /dev/null +++ b/doc/source/middleware.rst @@ -0,0 +1,404 @@ +.. _common_middleware: + +********** +Middleware +********** + +.. _account-quotas: + +Account Quotas +============== + +.. automodule:: swift.common.middleware.account_quotas + :members: + :show-inheritance: + +.. _s3api: + +AWS S3 Api +========== + +.. automodule:: swift.common.middleware.s3api.s3api + :members: + :show-inheritance: + +.. automodule:: swift.common.middleware.s3api.s3token + :members: + :show-inheritance: + +.. automodule:: swift.common.middleware.s3api.s3request + :members: + :show-inheritance: + +.. automodule:: swift.common.middleware.s3api.s3response + :members: + :show-inheritance: + +.. automodule:: swift.common.middleware.s3api.exception + :members: + :show-inheritance: + +.. automodule:: swift.common.middleware.s3api.etree + :members: _Element + :show-inheritance: + +.. automodule:: swift.common.middleware.s3api.utils + :members: + :show-inheritance: + +.. automodule:: swift.common.middleware.s3api.subresource + :members: + :show-inheritance: + +.. automodule:: swift.common.middleware.s3api.acl_handlers + :members: + :show-inheritance: + +.. automodule:: swift.common.middleware.s3api.acl_utils + :members: + :show-inheritance: + +.. automodule:: swift.common.middleware.s3api.controllers.base + :members: + :show-inheritance: + +.. automodule:: swift.common.middleware.s3api.controllers.service + :members: + :show-inheritance: + +.. 
automodule:: swift.common.middleware.s3api.controllers.bucket + :members: + :show-inheritance: + +.. automodule:: swift.common.middleware.s3api.controllers.obj + :members: + :show-inheritance: + +.. automodule:: swift.common.middleware.s3api.controllers.acl + :members: + :show-inheritance: + +.. automodule:: swift.common.middleware.s3api.controllers.s3_acl + :members: + :show-inheritance: + +.. automodule:: swift.common.middleware.s3api.controllers.multi_upload + :members: + :show-inheritance: + +.. automodule:: swift.common.middleware.s3api.controllers.multi_delete + :members: + :show-inheritance: + +.. automodule:: swift.common.middleware.s3api.controllers.versioning + :members: + :show-inheritance: + +.. automodule:: swift.common.middleware.s3api.controllers.location + :members: + :show-inheritance: + +.. automodule:: swift.common.middleware.s3api.controllers.logging + :members: + :show-inheritance: + +Backend Ratelimit +================= + +.. automodule:: swift.common.middleware.backend_ratelimit + :members: + :show-inheritance: + +.. _bulk: + +Bulk Operations (Delete and Archive Auto Extraction) +==================================================== + +.. automodule:: swift.common.middleware.bulk + :members: + :show-inheritance: + +.. _catch_errors: + +CatchErrors +============= + +.. automodule:: swift.common.middleware.catch_errors + :members: + :show-inheritance: + +CNAME Lookup +============ + +.. automodule:: swift.common.middleware.cname_lookup + :members: + :show-inheritance: + +.. _container-quotas: + +Container Quotas +================ + +.. automodule:: swift.common.middleware.container_quotas + :members: + :show-inheritance: + +.. _container-sync: + +Container Sync Middleware +========================= + +.. automodule:: swift.common.middleware.container_sync + :members: + :show-inheritance: + +Cross Domain Policies +===================== + +.. automodule:: swift.common.middleware.crossdomain + :members: + :show-inheritance: + +.. _discoverability: + +Discoverability +=============== + +Swift will by default provide clients with an interface providing details +about the installation. Unless disabled (i.e ``expose_info=false`` in +:ref:`proxy-server-config`), a GET request to ``/info`` will return configuration +data in JSON format. An example response:: + + {"swift": {"version": "1.11.0"}, "staticweb": {}, "tempurl": {}} + +This would signify to the client that swift version 1.11.0 is running and that +staticweb and tempurl are available in this installation. + +There may be administrator-only information available via ``/info``. To +retrieve it, one must use an HMAC-signed request, similar to TempURL. +The signature may be produced like so:: + + swift tempurl GET 3600 /info secret 2>/dev/null | sed s/temp_url/swiftinfo/g + +Domain Remap +============ + +.. automodule:: swift.common.middleware.domain_remap + :members: + :show-inheritance: + +Dynamic Large Objects +===================== + +DLO support centers around a user specified filter that matches +segments and concatenates them together in object listing order. Please see +the DLO docs for :ref:`dlo-doc` further details. + +.. _encryption: + +Encryption +========== + +Encryption middleware should be deployed in conjunction with the +:ref:`keymaster` middleware. + +.. automodule:: swift.common.middleware.crypto + :members: + :show-inheritance: + +.. automodule:: swift.common.middleware.crypto.encrypter + :members: + :show-inheritance: + +.. 
automodule:: swift.common.middleware.crypto.decrypter + :members: + :show-inheritance: + +.. _etag_quoter: + +Etag Quoter +=========== + +.. automodule:: swift.common.middleware.etag_quoter + :members: + :show-inheritance: + +.. _formpost: + +FormPost +======== + +.. automodule:: swift.common.middleware.formpost + :members: + :show-inheritance: + +.. _gatekeeper: + +GateKeeper +========== + +.. automodule:: swift.common.middleware.gatekeeper + :members: + :show-inheritance: + +.. _healthcheck: + +Healthcheck +=========== + +.. automodule:: swift.common.middleware.healthcheck + :members: + :show-inheritance: + +.. _keymaster: + +Keymaster +========= + +Keymaster middleware should be deployed in conjunction with the +:ref:`encryption` middleware. + +.. automodule:: swift.common.middleware.crypto.keymaster + :members: + :show-inheritance: + +.. _keystoneauth: + +KeystoneAuth +============ + +.. automodule:: swift.common.middleware.keystoneauth + :members: + :show-inheritance: + +.. _list_endpoints: + +List Endpoints +============== + +.. automodule:: swift.common.middleware.list_endpoints + :members: + :show-inheritance: + +Memcache +======== + +.. automodule:: swift.common.middleware.memcache + :members: + :show-inheritance: + +Name Check (Forbidden Character Filter) +======================================= + +.. automodule:: swift.common.middleware.name_check + :members: + :show-inheritance: + +.. _object_versioning: + +Object Versioning +================= + +.. automodule:: swift.common.middleware.versioned_writes.object_versioning + :members: + :show-inheritance: + +Proxy Logging +============= + +.. automodule:: swift.common.middleware.proxy_logging + :members: + :show-inheritance: + +Ratelimit +========= + +.. automodule:: swift.common.middleware.ratelimit + :members: + :show-inheritance: + +.. _read_only: + +Read Only +========= + +.. automodule:: swift.common.middleware.read_only + :members: + :show-inheritance: + +.. _recon: + +Recon +===== + +.. automodule:: swift.common.middleware.recon + :members: + :show-inheritance: + +.. _copy: + +Server Side Copy +================ + +.. automodule:: swift.common.middleware.copy + :members: + :show-inheritance: + +Static Large Objects +==================== + +Please see +the SLO docs for :ref:`slo-doc` further details. + + +.. _staticweb: + +StaticWeb +========= + +.. automodule:: swift.common.middleware.staticweb + :members: + :show-inheritance: + +.. _symlink: + +Symlink +======= + +.. automodule:: swift.common.middleware.symlink + :members: + :show-inheritance: + +.. _common_tempauth: + +TempAuth +======== + +.. automodule:: swift.common.middleware.tempauth + :members: + :show-inheritance: + +.. _tempurl: + +TempURL +======= + +.. automodule:: swift.common.middleware.tempurl + :members: + :show-inheritance: + +.. _versioned_writes: + +Versioned Writes +================= + +.. automodule:: swift.common.middleware.versioned_writes.legacy + :members: + :show-inheritance: + +XProfile +============== + +.. automodule:: swift.common.middleware.xprofile + :members: + :show-inheritance: diff --git a/doc/source/misc.rst b/doc/source/misc.rst index 0c0d607267..1012b13bec 100644 --- a/doc/source/misc.rst +++ b/doc/source/misc.rst @@ -4,60 +4,60 @@ Misc **** -.. _exceptions: +.. _acls: -Exceptions -========== +ACLs +==== -.. automodule:: swift.common.exceptions +.. automodule:: swift.common.middleware.acl :members: - :undoc-members: :show-inheritance: -.. _constraints: +.. _buffered_http: -Constraints -=========== +Buffered HTTP +============= -.. 
automodule:: swift.common.constraints +.. automodule:: swift.common.bufferedhttp :members: - :undoc-members: :show-inheritance: -.. _utils: -Utils -===== +.. _config: -.. automodule:: swift.common.utils +Config +====== + +.. automodule:: swift.common.utils.config :members: :show-inheritance: -.. _common_tempauth: +.. _constraints: -TempAuth -======== +Constraints +=========== -.. automodule:: swift.common.middleware.tempauth +.. automodule:: swift.common.constraints :members: + :undoc-members: :show-inheritance: -.. _acls: - -ACLs -==== +Container Sync Realms +===================== -.. automodule:: swift.common.middleware.acl +.. automodule:: swift.common.container_sync_realms :members: :show-inheritance: -.. _wsgi: -WSGI -==== +.. _digest: -.. automodule:: swift.common.wsgi +Digest +====== + +.. automodule:: swift.common.digest :members: + :undoc-members: :show-inheritance: .. _direct_client: @@ -70,6 +70,16 @@ Direct Client :undoc-members: :show-inheritance: +.. _exceptions: + +Exceptions +========== + +.. automodule:: swift.common.exceptions + :members: + :undoc-members: + :show-inheritance: + .. _internal_client: Internal Client @@ -80,34 +90,39 @@ Internal Client :undoc-members: :show-inheritance: -.. _buffered_http: +.. _ipaddrs: -Buffered HTTP -============= +IPAddrs +======= -.. automodule:: swift.common.bufferedhttp +.. automodule:: swift.common.utils.ipaddrs :members: :show-inheritance: -.. _healthcheck: +.. _libc: -Healthcheck -=========== +Libc +==== -.. automodule:: swift.common.middleware.healthcheck +.. automodule:: swift.common.utils.libc :members: :show-inheritance: -.. _recon: +.. _logs: -Recon -=========== +Logs +==== -.. automodule:: swift.common.middleware.recon +.. automodule:: swift.common.utils.logs :members: :show-inheritance: -.. _memecached: +Manager +========= + +.. automodule:: swift.common.manager + :members: + :show-inheritance: MemCacheD ========= @@ -116,90 +131,86 @@ MemCacheD :members: :show-inheritance: -Manager -========= +.. _registry: -.. automodule:: swift.common.manager +Middleware Registry +=================== + +.. automodule:: swift.common.registry :members: + :undoc-members: :show-inheritance: -Ratelimit -========= +.. _request_helpers: + +Request Helpers +=============== -.. automodule:: swift.common.middleware.ratelimit +.. automodule:: swift.common.request_helpers :members: + :undoc-members: :show-inheritance: -StaticWeb -========= +.. _statsd_client: + +StatsdClient +============ -.. automodule:: swift.common.middleware.staticweb +.. automodule:: swift.common.statsd_client :members: :show-inheritance: -TempURL -======= +.. _storage_policy: -.. automodule:: swift.common.middleware.tempurl +Storage Policy +============== + +.. automodule:: swift.common.storage_policy :members: :show-inheritance: -FormPost -======== +.. _swob: -.. automodule:: swift.common.middleware.formpost +Swob +==== + +.. automodule:: swift.common.swob :members: :show-inheritance: + :special-members: __call__ -Domain Remap -============ +.. _timestamp: -.. automodule:: swift.common.middleware.domain_remap +Timestamp +========= + +.. automodule:: swift.common.utils.timestamp :members: :show-inheritance: -CNAME Lookup -============ +.. _base_utils: + +Utils Base +========== -.. automodule:: swift.common.middleware.cname_lookup +.. automodule:: swift.common.utils.base :members: :show-inheritance: -Proxy Logging -============= +.. _utils: -.. automodule:: swift.common.middleware.proxy_logging +Utils +===== + +.. 
automodule:: swift.common.utils :members: :show-inheritance: -CORS Headers -============ +.. _wsgi: -Cross Origin RequestS or CORS allows the browser to make requests against -Swift from another origin via the browser. This enables the use of HTML5 -forms and javascript uploads to swift. The owner of a container can set -three headers: - -+---------------------------------------------+-------------------------------+ -|Metadata | Use | -+=============================================+===============================+ -|X-Container-Meta-Access-Control-Allow-Origin | Origins to be allowed to | -| | make Cross Origin Requests, | -| | space separated | -+---------------------------------------------+-------------------------------+ -|X-Container-Meta-Access-Control-Max-Age | Max age for the Origin to | -| | hold the preflight results. | -+---------------------------------------------+-------------------------------+ -|X-Container-Meta-Access-Control-Allow-Headers| Headers to be allowed in | -| | actual request by browser. | -+---------------------------------------------+-------------------------------+ - -When the browser does a request it can issue a preflight request. The -preflight request is the OPTIONS call that verifies the Origin is allowed -to make the request. - -* Browser makes OPTIONS request to Swift -* Swift returns 200/401 to browser based on allowed origins -* If 200, browser makes PUT, POST, DELETE, HEAD, GET request to Swift - -CORS should be used in conjunction with TempURL and FormPost. +WSGI +==== + +.. automodule:: swift.common.wsgi + :members: + :show-inheritance: diff --git a/doc/source/object.rst b/doc/source/object.rst index 9a2643d4a7..73e9ee0eae 100644 --- a/doc/source/object.rst +++ b/doc/source/object.rst @@ -4,12 +4,22 @@ Object ****** -.. _object-server: +.. _object-auditor: -Object Server -============= +Object Auditor +============== -.. automodule:: swift.obj.server +.. automodule:: swift.obj.auditor + :members: + :undoc-members: + :show-inheritance: + +.. _object-diskfile: + +Object Backend +============== + +.. automodule:: swift.obj.diskfile :members: :undoc-members: :show-inheritance: @@ -24,23 +34,42 @@ Object Replicator :undoc-members: :show-inheritance: -.. _object-updater: +.. automodule:: swift.obj.ssync_sender + :members: + :undoc-members: + :show-inheritance: -Object Updater -============== +.. automodule:: swift.obj.ssync_receiver + :members: + :undoc-members: + :show-inheritance: -.. automodule:: swift.obj.updater +.. _object-reconstructor: + +Object Reconstructor +==================== + +.. automodule:: swift.obj.reconstructor :members: :undoc-members: :show-inheritance: -.. _object-auditor: +.. _object-server: -Object Auditor -============== +Object Server +============= -.. automodule:: swift.obj.auditor +.. automodule:: swift.obj.server :members: :undoc-members: :show-inheritance: +.. _object-updater: + +Object Updater +============== + +.. automodule:: swift.obj.updater + :members: + :undoc-members: + :show-inheritance: diff --git a/doc/source/ops_runbook/diagnose.rst b/doc/source/ops_runbook/diagnose.rst new file mode 100644 index 0000000000..976cdb70de --- /dev/null +++ b/doc/source/ops_runbook/diagnose.rst @@ -0,0 +1,1204 @@ +================================== +Identifying issues and resolutions +================================== + +Is the system up? +----------------- + +If you have a report that Swift is down, perform the following basic checks: + +#. Run swift functional tests. + +#. 
From a server in your data center, use ``curl`` to check ``/healthcheck``
+   (see below).
+
+#. If you have a monitoring system, check your monitoring system.
+
+#. Check your hardware load balancer infrastructure.
+
+#. Run swift-recon on a proxy node.
+
+Functional tests usage
+-----------------------
+
+We would recommend that you set up the functional tests to run against your
+production system. Run regularly, this can be a useful tool to validate
+that the system is configured correctly. In addition, it can provide
+early warning about failures in your system (if the functional tests stop
+working, user applications will also probably stop working).
+
+A script for running the functional tests is located in ``swift/.functests``.
+
+
+External monitoring
+-------------------
+
+We use pingdom.com to monitor the external Swift API. We suggest the
+following:
+
+- Do a GET on ``/healthcheck``
+
+- Create a container, make it public (``x-container-read:
+  .r*,.rlistings``), create a small file in the container; do a GET
+  on the object
+
+Diagnose: General approach
+--------------------------
+
+- Look at service status in your monitoring system.
+
+- In addition to system monitoring tools and issue logging by users,
+  swift errors will often result in log entries (see :ref:`swift_logs`).
+
+- Look at any logs your deployment tool produces.
+
+- Log files should be reviewed for error signatures (see below) that
+  may point to a known issue, or root cause issues reported by the
+  diagnostics tools, prior to escalation.
+
+Dependencies
+^^^^^^^^^^^^
+
+The Swift software is dependent on overall system health. Operating
+system level issues with network connectivity, domain name resolution,
+user management, hardware and system configuration and capacity in terms
+of memory and free disk space, may result in secondary Swift issues.
+System level issues should be resolved prior to diagnosis of swift
+issues.
+
+
+Diagnose: Swift-dispersion-report
+---------------------------------
+
+The swift-dispersion-report is a useful tool to gauge the general
+health of the system. Configure the ``swift-dispersion`` report to cover at
+a minimum every disk drive in your system (usually 1% coverage).
+See :ref:`dispersion_report` for details of how to configure and
+use the dispersion reporting tool.
+
+The ``swift-dispersion-report`` tool can take a long time to run, especially
+if any servers are down. We suggest you run it regularly
+(e.g., in a cron job) and save the results. This makes it easy to refer
+to the last report without having to wait for a long-running command
+to complete.
+
+Diagnose: Is system responding to ``/healthcheck``?
+---------------------------------------------------
+
+When you want to establish if a swift endpoint is running, run ``curl -k``
+against ``https://$ENDPOINT/healthcheck``.
+
+.. _swift_logs:
+
+Diagnose: Interpreting messages in ``/var/log/swift/`` files
+------------------------------------------------------------
+
+.. note::
+
+   In the Hewlett Packard Enterprise Helion Public Cloud we send logs to
+   ``proxy.log`` (proxy-server logs), ``server.log`` (object-server,
+   account-server, container-server logs), ``background.log`` (all
+   other servers [object-replicator, etc]).
+
+The following table lists known issues:
+
+.. list-table::
+   :widths: 25 25 25 25
+   :header-rows: 1
+
+   * - **Logfile**
+     - **Signature**
+     - **Issue**
+     - **Steps to take**
+   * - /var/log/syslog
+     - kernel: [] sd .... [csbu:sd...]
Sense Key: Medium Error + - Suggests disk surface issues + - Run ``swift-drive-audit`` on the target node to check for disk errors, + repair disk errors + * - /var/log/syslog + - kernel: [] sd .... [csbu:sd...] Sense Key: Hardware Error + - Suggests storage hardware issues + - Run diagnostics on the target node to check for disk failures, + replace failed disks + * - /var/log/syslog + - kernel: [] .... I/O error, dev sd.... ,sector .... + - + - Run diagnostics on the target node to check for disk errors + * - /var/log/syslog + - pound: NULL get_thr_arg + - Multiple threads woke up + - Noise, safe to ignore + * - /var/log/swift/proxy.log + - .... ERROR .... ConnectionTimeout .... + - A storage node is not responding in a timely fashion + - Check if node is down, not running Swift, + unconfigured, storage off-line or for network issues between the + proxy and non responding node + * - /var/log/swift/proxy.log + - proxy-server .... HTTP/1.0 500 .... + - A proxy server has reported an internal server error + - Examine the logs for any errors at the time the error was reported to + attempt to understand the cause of the error. + * - /var/log/swift/server.log + - .... ERROR .... ConnectionTimeout .... + - A storage server is not responding in a timely fashion + - Check if node is down, not running Swift, + unconfigured, storage off-line or for network issues between the + server and non responding node + * - /var/log/swift/server.log + - .... ERROR .... Remote I/O error: '/srv/node/disk.... + - A storage device is not responding as expected + - Run ``swift-drive-audit`` and check the filesystem named in the error + for corruption (unmount & xfs_repair). Check if the filesystem + is mounted and working. + * - /var/log/swift/background.log + - object-server ERROR container update failed .... Connection refused + - A container server node could not be contacted + - Check if node is down, not running Swift, + unconfigured, storage off-line or for network issues between the + server and non responding node + * - /var/log/swift/background.log + - object-updater ERROR with remote .... ConnectionTimeout + - The remote container server is busy + - If the container is very large, some errors updating it can be + expected. However, this error can also occur if there is a networking + issue. + * - /var/log/swift/background.log + - account-reaper STDOUT: .... error: ECONNREFUSED + - Network connectivity issue or the target server is down. + - Resolve network issue or reboot the target server + * - /var/log/swift/background.log + - .... ERROR .... ConnectionTimeout + - A storage server is not responding in a timely fashion + - The target server may be busy. However, this error can also occur if + there is a networking issue. + * - /var/log/swift/background.log + - .... ERROR syncing .... Timeout + - A timeout occurred syncing data to another node. + - The target server may be busy. However, this error can also occur if + there is a networking issue. + * - /var/log/swift/background.log + - .... ERROR Remote drive not mounted .... + - A storage server disk is unavailable + - Repair and remount the file system (on the remote node) + * - /var/log/swift/background.log + - object-replicator .... responded as unmounted + - A storage server disk is unavailable + - Repair and remount the file system (on the remote node) + * - /var/log/swift/\*.log + - STDOUT: EXCEPTION IN + - A unexpected error occurred + - Read the Traceback details, if it matches known issues + (e.g. 
active network/disk issues), check for re-ocurrences + after the primary issues have been resolved + * - /var/log/rsyncd.log + - rsync: mkdir "/disk....failed: No such file or directory.... + - A local storage server disk is unavailable + - Run diagnostics on the node to check for a failed or + unmounted disk + * - /var/log/swift* + - Exception: Could not bind to 0.0.0.0:6xxx + - Possible Swift process restart issue. This indicates an old swift + process is still running. + - Restart Swift services. If some swift services are reported down, + check if they left residual process behind. + +Diagnose: Parted reports the backup GPT table is corrupt +-------------------------------------------------------- + +- If a GPT table is broken, a message like the following should be + observed when the following command is run: + + .. code:: console + + $ sudo parted -l + + .. code:: console + + Error: The backup GPT table is corrupt, but the primary appears OK, + so that will be used. + + OK/Cancel? + +To fix, go to :ref:`fix_broken_gpt_table` + + +Diagnose: Drives diagnostic reports a FS label is not acceptable +---------------------------------------------------------------- + +If diagnostics reports something like "FS label: obj001dsk011 is not +acceptable", it indicates that a partition has a valid disk label, but an +invalid filesystem label. In such cases proceed as follows: + +#. Verify that the disk labels are correct: + + .. code:: console + + $ FS=/dev/sd#1 + + $ sudo parted -l | grep object + +#. If partition labels are inconsistent then, resolve the disk label issues + before proceeding: + + .. code:: console + + $ sudo parted -s ${FS} name ${PART_NO} ${PART_NAME} #Partition Label + $ # PART_NO is 1 for object disks and 3 for OS disks + $ # PART_NAME follows the convention seen in "sudo parted -l | grep object" + +#. If the Filesystem label is missing then create it with care: + + .. code:: console + + $ sudo xfs_admin -l ${FS} #Filesystem label (12 Char limit) + + $ # Check for the existence of a FS label + + $ OBJNO=<3 Length Object No.> + + $ # I.E OBJNO for sw-stbaz3-object0007 would be 007 + + $ DISKNO=<3 Length Disk No.> + + $ # I.E DISKNO for /dev/sdb would be 001, /dev/sdc would be 002 etc. + + $ sudo xfs_admin -L "obj${OBJNO}dsk${DISKNO}" ${FS} + + $ # Create a FS Label + +Diagnose: Failed LUNs +--------------------- + +.. note:: + + The HPE Helion Public Cloud uses direct attach SmartArray + controllers/drives. The information here is specific to that + environment. The hpacucli utility mentioned here may be called + hpssacli in your environment. + +The ``swift_diagnostics`` mount checks may return a warning that a LUN has +failed, typically accompanied by DriveAudit check failures and device +errors. + +Such cases are typically caused by a drive failure, and if drive check +also reports a failed status for the underlying drive, then follow +the procedure to replace the disk. + +Otherwise the lun can be re-enabled as follows: + +#. Generate a hpssacli diagnostic report. This report allows the DC + team to troubleshoot potential cabling or hardware issues so it is + imperative that you run it immediately when troubleshooting a failed + LUN. You will come back later and grep this file for more details, but + just generate it for now. + + .. code:: console + + $ sudo hpssacli controller all diag file=/tmp/hpacu.diag ris=on xml=off zip=off + +Export the following variables using the below instructions before +proceeding further. + +#. 
Print a list of logical drives and their numbers and take note of the
+   failed drive's number and array value (example output: "array A
+   logicaldrive 1..." would be exported as LDRIVE=1):
+
+   .. code:: console
+
+      $ sudo hpssacli controller slot=1 ld all show
+
+#. Export the number of the logical drive that was retrieved from the
+   previous command into the LDRIVE variable:
+
+   .. code:: console
+
+      $ export LDRIVE=
+
+#. Print the array value and Port:Box:Bay for all drives and take note of
+   the Port:Box:Bay for the failed drive (example output: " array A
+   physicaldrive 2C:1:1..." would be exported as PBOX=2C:1:1). Match the
+   array value of this output with the array value obtained from the
+   previous command to be sure you are working on the same drive. Also,
+   the array value usually matches the device name (for example, /dev/sdc
+   in the case of "array c"), but we will run a different command to be sure
+   we are operating on the correct device.
+
+   .. code:: console
+
+      $ sudo hpssacli controller slot=1 pd all show
+
+.. note::
+
+   Sometimes a LUN may appear to have failed because it is not, and cannot
+   be, mounted, but the hpssacli/parted commands may show no problems with
+   the LUNs/drives. In this case, the filesystem may be corrupt and it may
+   be necessary to run ``sudo xfs_check /dev/sd[a-l][1-2]`` to see if there
+   is an xfs issue. The results of running this command may require that
+   ``xfs_repair`` is run.
+
+#. Export the Port:Box:Bay for the failed drive into the PBOX variable:
+
+   .. code:: console
+
+      $ export PBOX=
+
+#. Print the physical device information and take note of the Disk Name
+   (example output: "Disk Name: /dev/sdk" would be exported as
+   DEV=/dev/sdk):
+
+   .. code:: console
+
+      $ sudo hpssacli controller slot=1 ld ${LDRIVE} show detail | grep -i "Disk Name"
+
+#. Export the device name variable from the preceding command (example:
+   /dev/sdk):
+
+   .. code:: console
+
+      $ export DEV=
+
+#. Export the filesystem variable. Disks that are split between the
+   operating system and data storage, typically sda and sdb, should only
+   have repairs done on their data filesystem, usually /dev/sda2 and
+   /dev/sdb2. Other data only disks have just one partition on the device,
+   so the filesystem will be 1. In any case you should verify the data
+   filesystem by running ``df -h | grep /srv/node`` and using the listed
+   data filesystem for the device in question as the export. For example:
+   /dev/sdk1.
+
+   .. code:: console
+
+      $ export FS=
+
+#. Verify the LUN is failed, and the device is not:
+
+   .. code:: console
+
+      $ sudo hpssacli controller slot=1 ld all show
+      $ sudo hpssacli controller slot=1 pd all show
+      $ sudo hpssacli controller slot=1 ld ${LDRIVE} show detail
+      $ sudo hpssacli controller slot=1 pd ${PBOX} show detail
+
+#. Stop the swift and rsync services:
+
+   .. code:: console
+
+      $ sudo service rsync stop
+      $ sudo swift-init shutdown all
+
+#. Unmount the problem drive, fix the LUN and the filesystem:
+
+   .. code:: console
+
+      $ sudo umount ${FS}
+
+#. If umount fails, you should run lsof to search for the mountpoint and
+   kill any lingering processes before repeating the unmount:
+
+   .. code:: console
+
+      $ sudo hpacucli controller slot=1 ld ${LDRIVE} modify reenable
+      $ sudo xfs_repair ${FS}
+
+#. If the ``xfs_repair`` complains about possible journal data, use the
+   ``xfs_repair -L`` option to zeroise the journal log.
+
+#. Once complete, test-mount the filesystem and tidy up its lost and
+   found area.
+
+   .. 
code:: console + + $ sudo mount ${FS} /mnt + $ sudo rm -rf /mnt/lost+found/ + $ sudo umount /mnt + +#. Mount the filesystem and restart swift and rsync. + +#. Run the following to determine if a DC ticket is needed to check the + cables on the node: + + .. code:: console + + $ grep -y media.exchanged /tmp/hpacu.diag + $ grep -y hot.plug.count /tmp/hpacu.diag + +#. If the output reports any non 0x00 values, it suggests that the cables + should be checked. For example, log a DC ticket to check the sas cables + between the drive and the expander. + +.. _diagnose_slow_disk_drives: + +Diagnose: Slow disk devices +--------------------------- + +.. note:: + + collectl is an open-source performance gathering/analysis tool. + +If the diagnostics report a message such as ``sda: drive is slow``, you +should log onto the node and run the following command (remove ``-c 1`` option to continuously monitor +the data): + +.. code:: console + + $ /usr/bin/collectl -s D -c 1 + waiting for 1 second sample... + # DISK STATISTICS (/sec) + # <---------reads---------><---------writes---------><--------averages--------> Pct + #Name KBytes Merged IOs Size KBytes Merged IOs Size RWSize QLen Wait SvcTim Util + sdb 204 0 33 6 43 0 4 11 6 1 7 6 23 + sda 84 0 13 6 108 21 6 18 10 1 7 7 13 + sdc 100 0 16 6 0 0 0 0 6 1 7 6 9 + sdd 140 0 22 6 22 0 2 11 6 1 9 9 22 + sde 76 0 12 6 255 0 52 5 5 1 2 1 10 + sdf 276 0 44 6 0 0 0 0 6 1 11 8 38 + sdg 112 0 17 7 18 0 2 9 6 1 7 7 13 + sdh 3552 0 73 49 0 0 0 0 48 1 9 8 62 + sdi 72 0 12 6 0 0 0 0 6 1 8 8 10 + sdj 112 0 17 7 22 0 2 11 7 1 10 9 18 + sdk 120 0 19 6 21 0 2 11 6 1 8 8 16 + sdl 144 0 22 7 18 0 2 9 6 1 9 7 18 + dm-0 0 0 0 0 0 0 0 0 0 0 0 0 0 + dm-1 0 0 0 0 60 0 15 4 4 0 0 0 0 + dm-2 0 0 0 0 48 0 12 4 4 0 0 0 0 + dm-3 0 0 0 0 0 0 0 0 0 0 0 0 0 + dm-4 0 0 0 0 0 0 0 0 0 0 0 0 0 + dm-5 0 0 0 0 0 0 0 0 0 0 0 0 0 + + +Look at the ``Wait`` and ``SvcTime`` values. It is not normal for +these values to exceed 50msec. This is known to impact customer +performance (upload/download). For a controller problem, many/all drives +will show long wait and service times. A reboot may correct the problem; +otherwise hardware replacement is needed. + +Another way to look at the data is as follows: + +.. 
code:: console + + $ /opt/hp/syseng/disk-anal.pl -d + Disk: sda Wait: 54580 371 65 25 12 6 6 0 1 2 0 46 + Disk: sdb Wait: 54532 374 96 36 16 7 4 1 0 2 0 46 + Disk: sdc Wait: 54345 554 105 29 15 4 7 1 4 4 0 46 + Disk: sdd Wait: 54175 553 254 31 20 11 6 6 2 2 1 53 + Disk: sde Wait: 54923 66 56 15 8 7 7 0 1 0 2 29 + Disk: sdf Wait: 50952 941 565 403 426 366 442 447 338 99 38 97 + Disk: sdg Wait: 50711 689 808 562 642 675 696 185 43 14 7 82 + Disk: sdh Wait: 51018 668 688 483 575 542 692 275 55 22 9 87 + Disk: sdi Wait: 51012 1011 849 672 568 240 344 280 38 13 6 81 + Disk: sdj Wait: 50724 743 770 586 662 509 684 283 46 17 11 79 + Disk: sdk Wait: 50886 700 585 517 633 511 729 352 89 23 8 81 + Disk: sdl Wait: 50106 617 794 553 604 504 532 501 288 234 165 216 + Disk: sda Time: 55040 22 16 6 1 1 13 0 0 0 3 12 + + Disk: sdb Time: 55014 41 19 8 3 1 8 0 0 0 3 17 + Disk: sdc Time: 55032 23 14 8 9 2 6 1 0 0 0 19 + Disk: sdd Time: 55022 29 17 12 6 2 11 0 0 0 1 14 + Disk: sde Time: 55018 34 15 11 12 1 9 0 0 0 2 12 + Disk: sdf Time: 54809 250 45 7 1 0 0 0 0 0 1 1 + Disk: sdg Time: 55070 36 6 2 0 0 0 0 0 0 0 0 + Disk: sdh Time: 55079 33 2 0 0 0 0 0 0 0 0 0 + Disk: sdi Time: 55074 28 7 2 0 0 2 0 0 0 0 1 + Disk: sdj Time: 55067 35 10 0 1 0 0 0 0 0 0 1 + Disk: sdk Time: 55068 31 10 3 0 0 1 0 0 0 0 1 + Disk: sdl Time: 54905 130 61 7 3 4 1 0 0 0 0 3 + +This shows the historical distribution of the wait and service times +over a day. This is how you read it: + +- sda did 54580 operations with a short wait time, 371 operations with + a longer wait time and 65 with an even longer wait time. + +- sdl did 50106 operations with a short wait time, but as you can see + many took longer. + +There is a clear pattern that sdf to sdl have a problem. Actually, sda +to sde would more normally have lots of zeros in their data. But maybe +this is a busy system. In this example it is worth changing the +controller as the individual drives may be ok. + +After the controller is changed, use collectl -s D as described above to +see if the problem has cleared. disk-anal.pl will continue to show +historical data. You can look at recent data as follows. It only looks +at data from 13:15 to 14:15. As you can see, this is a relatively clean +system (few if any long wait or service times): + +.. code:: console + + $ /opt/hp/syseng/disk-anal.pl -d -t 13:15-14:15 + Disk: sda Wait: 3600 0 0 0 0 0 0 0 0 0 0 0 + Disk: sdb Wait: 3600 0 0 0 0 0 0 0 0 0 0 0 + Disk: sdc Wait: 3600 0 0 0 0 0 0 0 0 0 0 0 + Disk: sdd Wait: 3600 0 0 0 0 0 0 0 0 0 0 0 + Disk: sde Wait: 3600 0 0 0 0 0 0 0 0 0 0 0 + Disk: sdf Wait: 3600 0 0 0 0 0 0 0 0 0 0 0 + Disk: sdg Wait: 3594 6 0 0 0 0 0 0 0 0 0 0 + Disk: sdh Wait: 3600 0 0 0 0 0 0 0 0 0 0 0 + Disk: sdi Wait: 3600 0 0 0 0 0 0 0 0 0 0 0 + Disk: sdj Wait: 3600 0 0 0 0 0 0 0 0 0 0 0 + Disk: sdk Wait: 3600 0 0 0 0 0 0 0 0 0 0 0 + Disk: sdl Wait: 3599 1 0 0 0 0 0 0 0 0 0 0 + Disk: sda Time: 3600 0 0 0 0 0 0 0 0 0 0 0 + Disk: sdb Time: 3600 0 0 0 0 0 0 0 0 0 0 0 + Disk: sdc Time: 3600 0 0 0 0 0 0 0 0 0 0 0 + Disk: sdd Time: 3600 0 0 0 0 0 0 0 0 0 0 0 + Disk: sde Time: 3600 0 0 0 0 0 0 0 0 0 0 0 + Disk: sdf Time: 3600 0 0 0 0 0 0 0 0 0 0 0 + Disk: sdg Time: 3594 6 0 0 0 0 0 0 0 0 0 0 + Disk: sdh Time: 3600 0 0 0 0 0 0 0 0 0 0 0 + Disk: sdi Time: 3600 0 0 0 0 0 0 0 0 0 0 0 + Disk: sdj Time: 3600 0 0 0 0 0 0 0 0 0 0 0 + Disk: sdk Time: 3600 0 0 0 0 0 0 0 0 0 0 0 + Disk: sdl Time: 3599 1 0 0 0 0 0 0 0 0 0 0 + +For long wait times, where the service time appears normal is to check +the logical drive cache status. 
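+As a quick check, the SmartArray tooling referenced earlier in this
+runbook (``hpssacli``/``hpacucli``) can report the controller and
+per-logical-drive cache state. This is only a sketch; the slot number
+is an assumption carried over from the earlier examples:
+
+.. code:: console
+
+   $ # Controller-level cache and battery/capacitor status
+   $ sudo hpssacli controller slot=1 show detail | grep -i cache
+
+   $ # Per-logical-drive cache (array accelerator) status
+   $ sudo hpssacli controller slot=1 ld all show detail | grep -i "array accelerator"
+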
While the cache may be enabled, it can +be disabled on a per-drive basis. + +Diagnose: Slow network link - Measuring network performance +----------------------------------------------------------- + +Network faults can cause performance between Swift nodes to degrade. Testing +with ``netperf`` is recommended. Other methods (such as copying large +files) may also work, but can produce inconclusive results. + +Install ``netperf`` on all systems if not +already installed. Check that the UFW rules for its control port are in place. +However, there are no pre-opened ports for netperf's data connection. Pick a +port number. In this example, 12866 is used because it is one higher +than netperf's default control port number, 12865. If you get very +strange results including zero values, you may not have gotten the data +port opened in UFW at the target or may have gotten the netperf +command-line wrong. + +Pick a ``source`` and ``target`` node. The source is often a proxy node +and the target is often an object node. Using the same source proxy you +can test communication to different object nodes in different AZs to +identity possible bottlenecks. + +Running tests +^^^^^^^^^^^^^ + +#. Prepare the ``target`` node as follows: + + .. code:: console + + $ sudo iptables -I INPUT -p tcp -j ACCEPT + + Or, do: + + .. code:: console + + $ sudo ufw allow 12866/tcp + +#. On the ``source`` node, run the following command to check + throughput. Note the double-dash before the -P option. + The command takes 10 seconds to complete. The ``target`` node is 192.168.245.5. + + .. code:: console + + $ netperf -H 192.168.245.5 -- -P 12866 + MIGRATED TCP STREAM TEST from 0.0.0.0 (0.0.0.0) port 12866 AF_INET to + .72.4 (.72.4) port 12866 AF_INET : demo + Recv Send Send + Socket Socket Message Elapsed + Size Size Size Time Throughput + bytes bytes bytes secs. 10^6bits/sec + 87380 16384 16384 10.02 923.69 + +#. On the ``source`` node, run the following command to check latency: + + .. code:: console + + $ netperf -H 192.168.245.5 -t TCP_RR -- -P 12866 + MIGRATED TCP REQUEST/RESPONSE TEST from 0.0.0.0 (0.0.0.0) port 12866 + AF_INET to .72.4 (.72.4) port 12866 AF_INET : demo + : first burst 0 + Local Remote Socket Size Request Resp. Elapsed Trans. + Send Recv Size Size Time Rate + bytes Bytes bytes bytes secs. per sec + 16384 87380 1 1 10.00 11753.37 + 16384 87380 + +Expected results +^^^^^^^^^^^^^^^^ + +Faults will show up as differences between different pairs of nodes. +However, for reference, here are some expected numbers: + +- For throughput, proxy to proxy, expect ~9300 Mbit/sec (proxies have + a 10Ge link). + +- For throughout, proxy to object, expect ~920 Mbit/sec (at time of + writing this, object nodes have a 1Ge link). + +- For throughput, object to object, expect ~920 Mbit/sec. + +- For latency (all types), expect ~11000 transactions/sec. + +Diagnose: Remapping sectors experiencing UREs +--------------------------------------------- + +#. Find the bad sector, device, and filesystem in ``kern.log``. + +#. Set the environment variables SEC, DEV & FS, for example: + + .. code:: console + + $ SEC=2930954256 + $ DEV=/dev/sdi + $ FS=/dev/sdi1 + +#. Verify that the sector is bad: + + .. code:: console + + $ sudo dd if=${DEV} of=/dev/null bs=512 count=1 skip=${SEC} + +#. If the sector is bad this command will output an input/output error: + + .. code:: console + + dd: reading `/dev/sdi`: Input/output error + 0+0 records in + 0+0 records out + +#. 
Prevent chef from attempting to re-mount the filesystem while the + repair is in progress: + + .. code:: console + + $ sudo mv /etc/chef/client.pem /etc/chef/xx-client.xx-pem + +#. Stop the swift and rsync service: + + .. code:: console + + $ sudo service rsync stop + $ sudo swift-init shutdown all + +#. Unmount the problem drive: + + .. code:: console + + $ sudo umount ${FS} + +#. Overwrite/remap the bad sector: + + .. code:: console + + $ sudo dd_rescue -d -A -m8b -s ${SEC}b ${DEV} ${DEV} + +#. This command should report an input/output error the first time + it is run. Run the command a second time, if it successfully remapped + the bad sector it should not report an input/output error. + +#. Verify the sector is now readable: + + .. code:: console + + $ sudo dd if=${DEV} of=/dev/null bs=512 count=1 skip=${SEC} + +#. If the sector is now readable this command should not report an + input/output error. + +#. If more than one problem sector is listed, set the SEC environment + variable to the next sector in the list: + + .. code:: console + + $ SEC=123456789 + +#. Repeat from step 8. + +#. Repair the filesystem: + + .. code:: console + + $ sudo xfs_repair ${FS} + +#. If ``xfs_repair`` reports that the filesystem has valuable filesystem + changes: + + .. code:: console + + $ sudo xfs_repair ${FS} + Phase 1 - find and verify superblock... + Phase 2 - using internal log + - zero log... + ERROR: The filesystem has valuable metadata changes in a log which + needs to be replayed. + Mount the filesystem to replay the log, and unmount it before + re-running xfs_repair. + If you are unable to mount the filesystem, then use the -L option to + destroy the log and attempt a repair. Note that destroying the log may + cause corruption -- please attempt a mount of the filesystem before + doing this. + +#. You should attempt to mount the filesystem, and clear the lost+found + area: + + .. code:: console + + $ sudo mount $FS /mnt + $ sudo rm -rf /mnt/lost+found/* + $ sudo umount /mnt + +#. If the filesystem fails to mount then you will need to use the + ``xfs_repair -L`` option to force log zeroing. + Repeat step 11. + +#. If ``xfs_repair`` reports that an additional input/output error has been + encountered, get the sector details as follows: + + .. code:: console + + $ sudo grep "I/O error" /var/log/kern.log | grep sector | tail -1 + +#. If new input/output error is reported then set the SEC environment + variable to the problem sector number: + + .. code:: console + + $ SEC=234567890 + +#. Repeat from step 8 + + +#. Remount the filesystem and restart swift and rsync. + + - If all UREs in the kern.log have been fixed and you are still unable + to have xfs_repair disk, it is possible that the URE's have + corrupted the filesystem or possibly destroyed the drive altogether. + In this case, the first step is to re-format the filesystem and if + this fails, get the disk replaced. + + +Diagnose: High system latency +----------------------------- + +.. note:: + + The latency measurements described here are specific to the HPE + Helion Public Cloud. + +- A bad NIC on a proxy server. However, as explained above, this + usually causes the peak to rise, but average should remain near + normal parameters. A quick fix is to shutdown the proxy. + +- A stuck memcache server. Accepts connections, but then will not respond. + Expect to see timeout messages in ``/var/log/proxy.log`` (port 11211). + Swift Diags will also report this as a failed node/port. A quick fix + is to shutdown the proxy server. 
+
+- A bad/broken object server can also cause problems if the accounts
+  used by the monitor program happen to live on the bad object server.
+
+- A general network problem within the data center. Compare the results
+  with the Pingdom monitors to see if they also have a problem.
+
+Diagnose: Interface reports errors
+----------------------------------
+
+Should a network interface on a Swift node begin reporting network
+errors, it may well indicate a cable, switch, or network issue.
+
+Get an overview of the interface with:
+
+.. code:: console
+
+   $ sudo ifconfig eth{n}
+   $ sudo ethtool eth{n}
+
+The ``Link Detected:`` indicator will read ``yes`` if the NIC is
+cabled.
+
+Establish the adapter type with:
+
+.. code:: console
+
+   $ sudo ethtool -i eth{n}
+
+Gather the interface statistics with:
+
+.. code:: console
+
+   $ sudo ethtool -S eth{n}
+
+If the NIC supports self test, this can be performed with:
+
+.. code:: console
+
+   $ sudo ethtool -t eth{n}
+
+Self tests should read ``PASS`` if the NIC is operating correctly.
+
+NIC module drivers can be re-initialised by carefully removing and
+re-installing the modules (this avoids rebooting the server).
+For example, Mellanox drivers use a two-part driver, mlx4_en and
+mlx4_core. To reload these you must carefully remove the mlx4_en
+(ethernet) module and then the mlx4_core module, and reinstall them
+in the reverse order.
+
+As the interface will be disabled while the modules are unloaded, you
+must be very careful not to lock yourself out, so it may be better
+to script this.
+
+Diagnose: Hung swift object replicator
+--------------------------------------
+
+If a replicator reports in its log that the remaining time exceeds
+100 hours, the swift ``object-replicator`` may be stuck and not
+making progress. Another useful way to check this is with the
+``swift-recon -r`` command on a swift proxy server:
+
+.. code:: console
+
+   $ sudo swift-recon -r
+   ===============================================================================
+
+   --> Starting reconnaissance on 384 hosts
+   ===============================================================================
+   [2013-07-17 12:56:19] Checking on replication
+   [replication_time] low: 2, high: 80, avg: 28.8, total: 11037, Failed: 0.0%, no_result: 0, reported: 383
+   Oldest completion was 2013-06-12 22:46:50 (12 days ago) by 192.168.245.3:6200.
+   Most recent completion was 2013-07-17 12:56:19 (5 seconds ago) by 192.168.245.5:6200.
+   ===============================================================================
+
+The ``Oldest completion`` line in this example indicates that the
+object-replicator on swift object server 192.168.245.3 has not completed
+the replication cycle in 12 days. This replicator is stuck. The object
+replicator cycle is generally less than 1 hour, though a replicator
+cycle of 15-20 hours can occur if nodes are added to the system and a
+new ring has been deployed.
+
+You can further check if the object replicator is stuck by logging on
+to the object server and checking the object replicator progress with
+the following command:
+
+.. 
code:: console + + $ sudo grep object-rep /var/log/swift/background.log | grep -e "Starting object replication" -e "Object replication complete" -e "partitions rep" + Jul 16 06:25:46 192.168.245.4 object-replicator 15344/16450 (93.28%) partitions replicated in 69018.48s (0.22/sec, 22h remaining) + Jul 16 06:30:46 192.168.245.4object-replicator 15344/16450 (93.28%) partitions replicated in 69318.58s (0.22/sec, 22h remaining) + Jul 16 06:35:46 192.168.245.4 object-replicator 15344/16450 (93.28%) partitions replicated in 69618.63s (0.22/sec, 23h remaining) + Jul 16 06:40:46 192.168.245.4 object-replicator 15344/16450 (93.28%) partitions replicated in 69918.73s (0.22/sec, 23h remaining) + Jul 16 06:45:46 192.168.245.4 object-replicator 15348/16450 (93.30%) partitions replicated in 70218.75s (0.22/sec, 24h remaining) + Jul 16 06:50:47 192.168.245.4object-replicator 15348/16450 (93.30%) partitions replicated in 70518.85s (0.22/sec, 24h remaining) + Jul 16 06:55:47 192.168.245.4 object-replicator 15348/16450 (93.30%) partitions replicated in 70818.95s (0.22/sec, 25h remaining) + Jul 16 07:00:47 192.168.245.4 object-replicator 15348/16450 (93.30%) partitions replicated in 71119.05s (0.22/sec, 25h remaining) + Jul 16 07:05:47 192.168.245.4 object-replicator 15348/16450 (93.30%) partitions replicated in 71419.15s (0.21/sec, 26h remaining) + Jul 16 07:10:47 192.168.245.4object-replicator 15348/16450 (93.30%) partitions replicated in 71719.25s (0.21/sec, 26h remaining) + Jul 16 07:15:47 192.168.245.4 object-replicator 15348/16450 (93.30%) partitions replicated in 72019.27s (0.21/sec, 27h remaining) + Jul 16 07:20:47 192.168.245.4object-replicator 15348/16450 (93.30%) partitions replicated in 72319.37s (0.21/sec, 27h remaining) + Jul 16 07:25:47 192.168.245.4 object-replicator 15348/16450 (93.30%) partitions replicated in 72619.47s (0.21/sec, 28h remaining) + Jul 16 07:30:47 192.168.245.4 object-replicator 15348/16450 (93.30%) partitions replicated in 72919.56s (0.21/sec, 28h remaining) + Jul 16 07:35:47 192.168.245.4 object-replicator 15348/16450 (93.30%) partitions replicated in 73219.67s (0.21/sec, 29h remaining) + Jul 16 07:40:47 192.168.245.4 object-replicator 15348/16450 (93.30%) partitions replicated in 73519.76s (0.21/sec, 29h remaining) + +The above status is output every 5 minutes to ``/var/log/swift/background.log``. + +.. note:: + + The 'remaining' time is increasing as time goes on, normally the + time remaining should be decreasing. Also note the partition number. For example, + 15344 remains the same for several status lines. Eventually the object + replicator detects the hang and attempts to make progress by killing the + problem thread. The replicator then progresses to the next partition but + quite often it again gets stuck on the same partition. + +One of the reasons for the object replicator hanging like this is +filesystem corruption on the drive. The following is a typical log entry +of a corrupted filesystem detected by the object replicator: + +.. 
code:: console
+
+   $ sudo bzgrep "Remote I/O error" /var/log/swift/background.log* | grep srv | tail -1
+   Jul 12 03:33:30 192.168.245.4 object-replicator STDOUT: ERROR:root:Error hashing suffix#012Traceback (most recent call last):#012 File
+   "/usr/lib/python2.7/dist-packages/swift/obj/replicator.py", line 199, in get_hashes#012 hashes[suffix] = hash_suffix(suffix_dir,
+   reclaim_age)#012 File "/usr/lib/python2.7/dist-packages/swift/obj/replicator.py", line 84, in hash_suffix#012 path_contents =
+   sorted(os.listdir(path))#012OSError: [Errno 121] Remote I/O error: '/srv/node/disk4/objects/1643763/b51'
+
+An ``ls`` of the problem file or directory usually shows something like the following:
+
+.. code:: console
+
+   $ ls -l /srv/node/disk4/objects/1643763/b51
+   ls: cannot access /srv/node/disk4/objects/1643763/b51: Remote I/O error
+
+If no entry with ``Remote I/O error`` occurs in the ``background.log`` it is
+not possible to determine why the object-replicator is hung. It may be
+that the ``Remote I/O error`` entry is older than 7 days and so has been
+rotated out of the logs. In this scenario it may be best to simply
+restart the object-replicator.
+
+#. Stop the object-replicator:
+
+   .. code:: console
+
+      # sudo swift-init object-replicator stop
+
+#. Make sure the object replicator has stopped; if it has hung, the stop
+   command will not stop the hung process:
+
+   .. code:: console
+
+      # ps auxww | grep swift-object-replicator
+
+#. If the previous ps shows the object-replicator is still running, kill
+   the process:
+
+   .. code:: console
+
+      # kill -9 
+
+#. Start the object-replicator:
+
+   .. code:: console
+
+      # sudo swift-init object-replicator start
+
+If the above grep did find a ``Remote I/O error`` then it may be possible
+to repair the problem filesystem.
+
+#. Stop swift and rsync:
+
+   .. code:: console
+
+      # sudo swift-init all shutdown
+      # sudo service rsync stop
+
+#. Make sure all swift processes have stopped:
+
+   .. code:: console
+
+      # ps auxww | grep swift | grep python
+
+#. Kill any swift processes still running.
+
+#. Unmount the problem filesystem:
+
+   .. code:: console
+
+      # sudo umount /srv/node/disk4
+
+#. Repair the filesystem:
+
+   .. code:: console
+
+      # sudo xfs_repair -P /dev/sde1
+
+#. If the ``xfs_repair`` fails then it may be necessary to re-format the
+   filesystem. See :ref:`fix_broken_xfs_filesystem`. If the
+   ``xfs_repair`` is successful, re-enable chef and replication should
+   commence again.
+
+
+Diagnose: High CPU load
+-----------------------
+
+The CPU load average on an object server, as shown with the
+``uptime`` command, is typically under 10 when the server is
+lightly to moderately loaded:
+
+.. code:: console
+
+   $ uptime
+   07:59:26 up 99 days, 5:57, 1 user, load average: 8.59, 8.39, 8.32
+
+During times of increased activity, due to user transactions or object
+replication, the CPU load average can increase to around 30.
+
+However, sometimes the CPU load average can increase significantly. The
+following is an example of an object server that has extremely high CPU
+load:
+
+.. code:: console
+
+   $ uptime
+   07:44:02 up 18:22, 1 user, load average: 407.12, 406.36, 404.59
+
+Further issues and resolutions
+------------------------------
+
+.. note::
+
+   The urgency levels in each **Action** column indicate whether or
+   not it is required to take immediate action, or if the problem can be worked
+   on during business hours.
+
+.. 
list-table:: + :widths: 33 33 33 + :header-rows: 1 + + * - **Scenario** + - **Description** + - **Action** + * - ``/healthcheck`` latency is high. + - The ``/healthcheck`` test does not tax the proxy very much so any drop in value is probably related to + network issues, rather than the proxies being very busy. A very slow proxy might impact the average + number, but it would need to be very slow to shift the number that much. + - Check networks. Do a ``curl https://:/healthcheck`` where + ``ip-address`` is individual proxy IP address. + Repeat this for every proxy server to see if you can pin point the problem. + + Urgency: If there are other indications that your system is slow, you should treat + this as an urgent problem. + * - Swift process is not running. + - You can use ``swift-init`` status to check if swift processes are running on any + given server. + - Run this command: + + .. code:: console + + $ sudo swift-init all start + + Examine messages in the swift log files to see if there are any + error messages related to any of the swift processes since the time you + ran the ``swift-init`` command. + + Take any corrective actions that seem necessary. + + Urgency: If this only affects one server, and you have more than one, + identifying and fixing the problem can wait until business hours. + If this same problem affects many servers, then you need to take corrective + action immediately. + * - ntpd is not running. + - NTP is not running. + - Configure and start NTP. + + Urgency: For proxy servers, this is vital. + + * - Host clock is not syncd to an NTP server. + - Node time settings does not match NTP server time. + This may take some time to sync after a reboot. + - Assuming NTP is configured and running, you have to wait until the times sync. + * - A swift process has hundreds, to thousands of open file descriptors. + - May happen to any of the swift processes. + Known to have happened with a ``rsyslod`` restart and where ``/tmp`` was hanging. + + - Restart the swift processes on the affected node: + + .. code:: console + + $ sudo swift-init all reload + + Urgency: + If known performance problem: Immediate + + If system seems fine: Medium + * - A swift process is not owned by the swift user. + - If the UID of the swift user has changed, then the processes might not be + owned by that UID. + - Urgency: If this only affects one server, and you have more than one, + identifying and fixing the problem can wait until business hours. + If this same problem affects many servers, then you need to take corrective + action immediately. + * - Object account or container files not owned by swift. + - This typically happens if during a reinstall or a re-image of a server that the UID + of the swift user was changed. The data files in the object account and container + directories are owned by the original swift UID. As a result, the current swift + user does not own these files. + - Correct the UID of the swift user to reflect that of the original UID. An alternate + action is to change the ownership of every file on all file systems. This alternate + action is often impractical and will take considerable time. + + Urgency: If this only affects one server, and you have more than one, + identifying and fixing the problem can wait until business hours. + If this same problem affects many servers, then you need to take corrective + action immediately. + * - A disk drive has a high IO wait or service time. + - If high wait IO times are seen for a single disk, then the disk drive is the problem. 
+ If most/all devices are slow, the controller is probably the source of the problem. + The controller cache may also be miss configured – which will cause similar long + wait or service times. + - As a first step, if your controllers have a cache, check that it is enabled and their battery/capacitor + is working. + + Second, reboot the server. + If problem persists, file a DC ticket to have the drive or controller replaced. + See :ref:`diagnose_slow_disk_drives` on how to check the drive wait or service times. + + Urgency: Medium + * - The network interface is not up. + - Use the ``ifconfig`` and ``ethtool`` commands to determine the network state. + - You can try restarting the interface. However, generally the interface + (or cable) is probably broken, especially if the interface is flapping. + + Urgency: If this only affects one server, and you have more than one, + identifying and fixing the problem can wait until business hours. + If this same problem affects many servers, then you need to take corrective + action immediately. + * - Network interface card (NIC) is not operating at the expected speed. + - The NIC is running at a slower speed than its nominal rated speed. + For example, it is running at 100 Mb/s and the NIC is a 1Ge NIC. + - 1. Try resetting the interface with: + + .. code:: console + + $ sudo ethtool -s eth0 speed 1000 + + ... and then run: + + .. code:: console + + $ sudo lshw -class + + See if size goes to the expected speed. Failing + that, check hardware (NIC cable/switch port). + + 2. If persistent, consider shutting down the server (especially if a proxy) + until the problem is identified and resolved. If you leave this server + running it can have a large impact on overall performance. + + Urgency: High + * - The interface RX/TX error count is non-zero. + - A value of 0 is typical, but counts of 1 or 2 do not indicate a problem. + - 1. For low numbers (For example, 1 or 2), you can simply ignore. Numbers in the range + 3-30 probably indicate that the error count has crept up slowly over a long time. + Consider rebooting the server to remove the report from the noise. + + Typically, when a cable or interface is bad, the error count goes to 400+. For example, + it stands out. There may be other symptoms such as the interface going up and down or + not running at correct speed. A server with a high error count should be watched. + + 2. If the error count continues to climb, consider taking the server down until + it can be properly investigated. In any case, a reboot should be done to clear + the error count. + + Urgency: High, if the error count increasing. + + * - In a swift log you see a message that a process has not replicated in over 24 hours. + - The replicator has not successfully completed a run in the last 24 hours. + This indicates that the replicator has probably hung. + - Use ``swift-init`` to stop and then restart the replicator process. + + Urgency: Low. However if you + recently added or replaced disk drives then you should treat this urgently. + * - Container Updater has not run in 4 hour(s). + - The service may appear to be running however, it may be hung. Examine their swift + logs to see if there are any error messages relating to the container updater. This + may potentially explain why the container is not running. + - Urgency: Medium + This may have been triggered by a recent restart of the rsyslog daemon. + Restart the service with: + + .. 
code:: console + + $ sudo swift-init reload + + * - Object replicator: Reports the remaining time and that time is more than 100 hours. + - Each replication cycle the object replicator writes a log message to its log + reporting statistics about the current cycle. This includes an estimate for the + remaining time needed to replicate all objects. If this time is longer than + 100 hours, there is a problem with the replication process. + - Urgency: Medium + Restart the service with: + + .. code:: console + + $ sudo swift-init object-replicator reload + + Check that the remaining replication time is going down. + diff --git a/doc/source/ops_runbook/index.rst b/doc/source/ops_runbook/index.rst new file mode 100644 index 0000000000..8bf3f425ac --- /dev/null +++ b/doc/source/ops_runbook/index.rst @@ -0,0 +1,27 @@ +================= +Swift Ops Runbook +================= + +This document contains operational procedures that Hewlett Packard Enterprise (HPE) uses to operate +and monitor the Swift system within the HPE Helion Public Cloud. This +document is an excerpt of a larger product-specific handbook. As such, +the material may appear incomplete. The suggestions and recommendations +made in this document are for our particular environment, and may not be +suitable for your environment or situation. We make no representations +concerning the accuracy, adequacy, completeness or suitability of the +information, suggestions or recommendations. This document are provided +for reference only. We are not responsible for your use of any +information, suggestions or recommendations contained herein. + + +.. toctree:: + :maxdepth: 2 + + diagnose.rst + procedures.rst + maintenance.rst + troubleshooting.rst + + + + diff --git a/doc/source/ops_runbook/maintenance.rst b/doc/source/ops_runbook/maintenance.rst new file mode 100644 index 0000000000..c63feb7bd5 --- /dev/null +++ b/doc/source/ops_runbook/maintenance.rst @@ -0,0 +1,330 @@ +================== +Server maintenance +================== + +General assumptions +~~~~~~~~~~~~~~~~~~~ + +- It is assumed that anyone attempting to replace hardware components + will have already read and understood the appropriate maintenance and + service guides. + +- It is assumed that where servers need to be taken off-line for + hardware replacement, that this will be done in series, bringing the + server back on-line before taking the next off-line. + +- It is assumed that the operations directed procedure will be used for + identifying hardware for replacement. + +Assessing the health of swift +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +You can run the swift-recon tool on a Swift proxy node to get a quick +check of how Swift is doing. Please note that the numbers below are +necessarily somewhat subjective. Sometimes parameters for which we +say 'low values are good' will have pretty high values for a time. Often +if you wait a while things get better. + +For example: + +.. code:: console + + $ sudo swift-recon -rla + =============================================================================== + [2012-03-10 12:57:21] Checking async pendings on 384 hosts... + Async stats: low: 0, high: 1, avg: 0, total: 1 + =============================================================================== + + [2012-03-10 12:57:22] Checking replication times on 384 hosts... 
+ [Replication Times] shortest: 1.4113877813, longest: 36.8293570836, avg: 4.86278064749 + =============================================================================== + + [2012-03-10 12:57:22] Checking load avg's on 384 hosts... + [5m load average] lowest: 2.22, highest: 9.5, avg: 4.59578125 + [15m load average] lowest: 2.36, highest: 9.45, avg: 4.62622395833 + [1m load average] lowest: 1.84, highest: 9.57, avg: 4.5696875 + =============================================================================== + +In the example above we ask for information on replication times (-r), +load averages (-l) and async pendings (-a). This is a healthy Swift +system. Rules-of-thumb for 'good' recon output are: + +- Nodes that respond are up and running Swift. If all nodes respond, + that is a good sign. But some nodes may time out. For example: + + .. code:: console + + -> [http://.29:6200/recon/load:] + -> [http://.31:6200/recon/load:] + +- That could be okay or could require investigation. + +- Low values (say < 10 for high and average) for async pendings are + good. Higher values occur when disks are down and/or when the system + is heavily loaded. Many simultaneous PUTs to the same container can + drive async pendings up. This may be normal, and may resolve itself + after a while. If it persists, one way to track down the problem is + to find a node with high async pendings (with ``swift-recon -av | sort + -n -k4``), then check its Swift logs, Often async pendings are high + because a node cannot write to a container on another node. Often + this is because the node or disk is offline or bad. This may be okay + if we know about it. + +- Low values for replication times are good. These values rise when new + rings are pushed, and when nodes and devices are brought back on + line. + +- Our 'high' load average values are typically in the 9-15 range. If + they are a lot bigger it is worth having a look at the systems + pushing the average up. Run ``swift-recon -av`` to get the individual + averages. To sort the entries with the highest at the end, + run ``swift-recon -av | sort -n -k4``. + +For comparison here is the recon output for the same system above when +two entire racks of Swift are down: + +.. code:: console + + [2012-03-10 16:56:33] Checking async pendings on 384 hosts... + -> http://.22:6200/recon/async: + -> http://.18:6200/recon/async: + -> http://.16:6200/recon/async: + -> http://.13:6200/recon/async: + -> http://.30:6200/recon/async: + -> http://.6:6200/recon/async: + ......... + -> http://.5:6200/recon/async: + -> http://.15:6200/recon/async: + -> http://.9:6200/recon/async: + -> http://.27:6200/recon/async: + -> http://.4:6200/recon/async: + -> http://.8:6200/recon/async: + Async stats: low: 243, high: 659, avg: 413, total: 132275 + =============================================================================== + [2012-03-10 16:57:48] Checking replication times on 384 hosts... + -> http://.22:6200/recon/replication: + -> http://.18:6200/recon/replication: + -> http://.16:6200/recon/replication: + -> http://.13:6200/recon/replication: + -> http://.30:6200/recon/replication: + -> http://.6:6200/recon/replication: + ............ 
+ -> http://.5:6200/recon/replication: + -> http://.15:6200/recon/replication: + -> http://.9:6200/recon/replication: + -> http://.27:6200/recon/replication: + -> http://.4:6200/recon/replication: + -> http://.8:6200/recon/replication: + [Replication Times] shortest: 1.38144306739, longest: 112.620954418, avg: 10.285 + 9475361 + =============================================================================== + [2012-03-10 16:59:03] Checking load avg's on 384 hosts... + -> http://.22:6200/recon/load: + -> http://.18:6200/recon/load: + -> http://.16:6200/recon/load: + -> http://.13:6200/recon/load: + -> http://.30:6200/recon/load: + -> http://.6:6200/recon/load: + ............ + -> http://.15:6200/recon/load: + -> http://.9:6200/recon/load: + -> http://.27:6200/recon/load: + -> http://.4:6200/recon/load: + -> http://.8:6200/recon/load: + [5m load average] lowest: 1.71, highest: 4.91, avg: 2.486375 + [15m load average] lowest: 1.79, highest: 5.04, avg: 2.506125 + [1m load average] lowest: 1.46, highest: 4.55, avg: 2.4929375 + =============================================================================== + +.. note:: + + The replication times and load averages are within reasonable + parameters, even with 80 object stores down. Async pendings, however is + quite high. This is due to the fact that the containers on the servers + which are down cannot be updated. When those servers come back up, async + pendings should drop. If async pendings were at this level without an + explanation, we have a problem. + +Recon examples +~~~~~~~~~~~~~~ + +Here is an example of noting and tracking down a problem with recon. + +Running reccon shows some async pendings: + +.. code:: console + + $ ssh -q .132.7 sudo swift-recon -alr + =============================================================================== + [2012-03-14 17:25:55] Checking async pendings on 384 hosts... + Async stats: low: 0, high: 23, avg: 8, total: 3356 + =============================================================================== + [2012-03-14 17:25:55] Checking replication times on 384 hosts... + [Replication Times] shortest: 1.49303831657, longest: 39.6982825994, avg: 4.2418222066 + =============================================================================== + [2012-03-14 17:25:56] Checking load avg's on 384 hosts... + [5m load average] lowest: 2.35, highest: 8.88, avg: 4.45911458333 + [15m load average] lowest: 2.41, highest: 9.11, avg: 4.504765625 + [1m load average] lowest: 1.95, highest: 8.56, avg: 4.40588541667 + =============================================================================== + +Why? Running recon again with -av swift (not shown here) tells us that +the node with the highest (23) is .72.61. Looking at the log +files on .72.61 we see: + +.. 
code:: console + + $ sudo tail -f /var/log/swift/background.log | - grep -i ERROR + Mar 14 17:28:06 container-replicator ERROR Remote drive not mounted + {'zone': 5, 'weight': 1952.0, 'ip': '.204.119', 'id': 5481, 'meta': '', 'device': 'disk6', 'port': 6201} + Mar 14 17:28:06 container-replicator ERROR Remote drive not mounted + {'zone': 5, 'weight': 1952.0, 'ip': '.204.119', 'id': 5481, 'meta': '', 'device': 'disk6', 'port': 6201} + Mar 14 17:28:09 container-replicator ERROR Remote drive not mounted + {'zone': 5, 'weight': 1952.0, 'ip': '.204.20', 'id': 2311, 'meta': '', 'device': 'disk5', 'port': 6201} + Mar 14 17:28:11 container-replicator ERROR Remote drive not mounted + {'zone': 5, 'weight': 1952.0, 'ip': '.204.20', 'id': 2311, 'meta': '', 'device': 'disk5', 'port': 6201} + Mar 14 17:28:13 container-replicator ERROR Remote drive not mounted + {'zone': 5, 'weight': 1952.0, 'ip': '.204.119', 'id': 5481, 'meta': '', 'device': 'disk6', 'port': 6201} + Mar 14 17:28:13 container-replicator ERROR Remote drive not mounted + {'zone': 5, 'weight': 1952.0, 'ip': '.204.119', 'id': 5481, 'meta': '', 'device': 'disk6', 'port': 6201} + Mar 14 17:28:15 container-replicator ERROR Remote drive not mounted + {'zone': 5, 'weight': 1952.0, 'ip': '.204.20', 'id': 2311, 'meta': '', 'device': 'disk5', 'port': 6201} + Mar 14 17:28:15 container-replicator ERROR Remote drive not mounted + {'zone': 5, 'weight': 1952.0, 'ip': '.204.20', 'id': 2311, 'meta': '', 'device': 'disk5', 'port': 6201} + Mar 14 17:28:19 container-replicator ERROR Remote drive not mounted + {'zone': 5, 'weight': 1952.0, 'ip': '.204.20', 'id': 2311, 'meta': '', 'device': 'disk5', 'port': 6201} + Mar 14 17:28:19 container-replicator ERROR Remote drive not mounted + {'zone': 5, 'weight': 1952.0, 'ip': '.204.20', 'id': 2311, 'meta': '', 'device': 'disk5', 'port': 6201} + Mar 14 17:28:20 container-replicator ERROR Remote drive not mounted + {'zone': 5, 'weight': 1952.0, 'ip': '.204.119', 'id': 5481, 'meta': '', 'device': 'disk6', 'port': 6201} + Mar 14 17:28:21 container-replicator ERROR Remote drive not mounted + {'zone': 5, 'weight': 1952.0, 'ip': '.204.20', 'id': 2311, 'meta': '', 'device': 'disk5', 'port': 6201} + Mar 14 17:28:21 container-replicator ERROR Remote drive not mounted + {'zone': 5, 'weight': 1952.0, 'ip': '.204.20', 'id': 2311, 'meta': '', 'device': 'disk5', 'port': 6201} + Mar 14 17:28:22 container-replicator ERROR Remote drive not mounted + {'zone': 5, 'weight': 1952.0, 'ip': '.204.20', 'id': 2311, 'meta': '', 'device': 'disk5', 'port': 6201} + +That is why this node has a lot of async pendings: a bunch of disks that +are not mounted on and . There may be other issues, +but clearing this up will likely drop the async pendings a fair bit, as +other nodes will be having the same problem. + +Assessing the availability risk when multiple storage servers are down +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +.. note:: + + This procedure will tell you if you have a problem, however, in practice + you will find that you will not use this procedure frequently. + +If three storage nodes (or, more precisely, three disks on three +different storage nodes) are down, there is a small but nonzero +probability that user objects, containers, or accounts will not be +available. + +Procedure +--------- + +.. note:: + + swift has three rings: one each for objects, containers and accounts. + This procedure should be run three times, each time specifying the + appropriate ``*.builder`` file. + +#. 
Determine whether all three nodes are in different Swift zones by + running the ring builder on a proxy node to determine which zones + the storage nodes are in. For example: + + .. code:: console + + % sudo swift-ring-builder /etc/swift/object.builder + /etc/swift/object.builder, build version 1467 + 2097152 partitions, 3 replicas, 5 zones, 1320 devices, 0.02 balance + The minimum number of hours before a partition can be reassigned is 24 + Devices: id zone ip address port name weight partitions balance meta + 0 1 .4 6200 disk0 1708.00 4259 -0.00 + 1 1 .4 6200 disk1 1708.00 4260 0.02 + 2 1 .4 6200 disk2 1952.00 4868 0.01 + 3 1 .4 6200 disk3 1952.00 4868 0.01 + 4 1 .4 6200 disk4 1952.00 4867 -0.01 + +#. Here, node .4 is in zone 1. If two or more of the three + nodes under consideration are in the same Swift zone, they do not + have any ring partitions in common; there is little/no data + availability risk if all three nodes are down. + +#. If the nodes are in three distinct Swift zones it is necessary to + whether the nodes have ring partitions in common. Run ``swift-ring`` + builder again, this time with the ``list_parts`` option and specify + the nodes under consideration. For example: + + .. code:: console + + % sudo swift-ring-builder /etc/swift/object.builder list_parts .8 .15 .72.2 + Partition Matches + 91 2 + 729 2 + 3754 2 + 3769 2 + 3947 2 + 5818 2 + 7918 2 + 8733 2 + 9509 2 + 10233 2 + +#. The ``list_parts`` option to the ring builder indicates how many ring + partitions the nodes have in common. If, as in this case, the + first entry in the list has a 'Matches' column of 2 or less, there + is no data availability risk if all three nodes are down. + +#. If the 'Matches' column has entries equal to 3, there is some data + availability risk if all three nodes are down. The risk is generally + small, and is proportional to the number of entries that have a 3 in + the Matches column. For example: + + .. code:: console + + Partition Matches + 26865 3 + 362367 3 + 745940 3 + 778715 3 + 797559 3 + 820295 3 + 822118 3 + 839603 3 + 852332 3 + 855965 3 + 858016 3 + +#. A quick way to count the number of rows with 3 matches is: + + .. code:: console + + % sudo swift-ring-builder /etc/swift/object.builder list_parts .8 .15 .72.2 | grep "3$" | wc -l + + 30 + +#. In this case the nodes have 30 out of a total of 2097152 partitions + in common; about 0.001%. In this case the risk is small/nonzero. + Recall that a partition is simply a portion of the ring mapping + space, not actual data. So having partitions in common is a necessary + but not sufficient condition for data unavailability. + + .. note:: + + We should not bring down a node for repair if it shows + Matches entries of 3 with other nodes that are also down. + + If three nodes that have 3 partitions in common are all down, there is + a nonzero probability that data are unavailable and we should work to + bring some or all of the nodes up ASAP. + +Swift startup/shutdown +~~~~~~~~~~~~~~~~~~~~~~ + +- Use reload - not stop/start/restart. + +- Try to roll sets of servers (especially proxy) in groups of less + than 20% of your servers. diff --git a/doc/source/ops_runbook/procedures.rst b/doc/source/ops_runbook/procedures.rst new file mode 100644 index 0000000000..1d84d59698 --- /dev/null +++ b/doc/source/ops_runbook/procedures.rst @@ -0,0 +1,412 @@ +================================= +Software configuration procedures +================================= + +.. 
_fix_broken_gpt_table:
+
+Fix broken GPT table (broken disk partition)
+~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
+
+- If a GPT table is broken, a message like the following should be
+  observed when the command...
+
+  .. code:: console
+
+     $ sudo parted -l
+
+- ... is run.
+
+  .. code:: console
+
+     ...
+     Error: The backup GPT table is corrupt, but the primary appears OK, so that will
+     be used.
+     OK/Cancel?
+
+#. To fix this, first install the ``gdisk`` program:
+
+   .. code:: console
+
+      $ sudo aptitude install gdisk
+
+#. Run ``gdisk`` for the particular drive with the damaged partition:
+
+   .. code:: console
+
+      $ sudo gdisk /dev/sd*a-l*
+      GPT fdisk (gdisk) version 0.6.14
+
+      Caution: invalid backup GPT header, but valid main header; regenerating
+      backup header from main header.
+
+      Warning! One or more CRCs don't match. You should repair the disk!
+
+      Partition table scan:
+        MBR: protective
+        BSD: not present
+        APM: not present
+        GPT: damaged
+      /dev/sd
+      *****************************************************************************
+      Caution: Found protective or hybrid MBR and corrupt GPT. Using GPT, but disk
+      verification and recovery are STRONGLY recommended.
+      *****************************************************************************
+
+#. On the command prompt, type ``r`` (recovery and transformation
+   options), followed by ``d`` (use main GPT header), ``v`` (verify disk)
+   and finally ``w`` (write table to disk and exit). You will also need to
+   enter ``Y`` when prompted in order to confirm actions.
+
+   .. code:: console
+
+      Command (? for help): r
+
+      Recovery/transformation command (? for help): d
+
+      Recovery/transformation command (? for help): v
+
+      Caution: The CRC for the backup partition table is invalid. This table may
+      be corrupt. This program will automatically create a new backup partition
+      table when you save your partitions.
+
+      Caution: Partition 1 doesn't begin on a 8-sector boundary. This may
+      result in degraded performance on some modern (2009 and later) hard disks.
+
+      Caution: Partition 2 doesn't begin on a 8-sector boundary. This may
+      result in degraded performance on some modern (2009 and later) hard disks.
+
+      Caution: Partition 3 doesn't begin on a 8-sector boundary. This may
+      result in degraded performance on some modern (2009 and later) hard disks.
+
+      Identified 1 problems!
+
+      Recovery/transformation command (? for help): w
+
+      Final checks complete. About to write GPT data. THIS WILL OVERWRITE EXISTING
+      PARTITIONS!!
+
+      Do you want to proceed, possibly destroying your data? (Y/N): Y
+
+      OK; writing new GUID partition table (GPT).
+      The operation has completed successfully.
+
+#. Run the following command; it should now show that the partition is
+   recovered and healthy again:
+
+   .. code:: console
+
+      $ sudo parted /dev/sd#
+
+#. Finally, uninstall ``gdisk`` from the node:
+
+   .. code:: console
+
+      $ sudo aptitude remove gdisk
+
+.. _fix_broken_xfs_filesystem:
+
+Procedure: Fix broken XFS filesystem
+~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
+
+#. A filesystem may be corrupt or broken if the following output is
+   observed when checking its label:
+
+   .. code:: console
+
+      $ sudo xfs_admin -l /dev/sd#
+        cache_node_purge: refcount was 1, not zero (node=0x25d5ee0)
+        xfs_admin: cannot read root inode (117)
+        cache_node_purge: refcount was 1, not zero (node=0x25d92b0)
+        xfs_admin: cannot read realtime bitmap inode (117)
+        bad sb magic # 0 in AG 1
+        failed to read label in AG 1
+
+#. 
Run the following commands to remove the broken/corrupt filesystem and replace. + (This example uses the filesystem ``/dev/sdb2``) Firstly need to replace the partition: + + .. code:: console + + $ sudo parted + GNU Parted 2.3 + Using /dev/sda + Welcome to GNU Parted! Type 'help' to view a list of commands. + (parted) select /dev/sdb + Using /dev/sdb + (parted) p + Model: HP LOGICAL VOLUME (scsi) + Disk /dev/sdb: 2000GB + Sector size (logical/physical): 512B/512B + Partition Table: gpt + + Number Start End Size File system Name Flags + 1 17.4kB 1024MB 1024MB ext3 boot + 2 1024MB 1751GB 1750GB xfs sw-aw2az1-object045-disk1 + 3 1751GB 2000GB 249GB lvm + + (parted) rm 2 + (parted) mkpart primary 2 -1 + Warning: You requested a partition from 2000kB to 2000GB. + The closest location we can manage is 1024MB to 1751GB. + Is this still acceptable to you? + Yes/No? Yes + Warning: The resulting partition is not properly aligned for best performance. + Ignore/Cancel? Ignore + (parted) p + Model: HP LOGICAL VOLUME (scsi) + Disk /dev/sdb: 2000GB + Sector size (logical/physical): 512B/512B + Partition Table: gpt + + Number Start End Size File system Name Flags + 1 17.4kB 1024MB 1024MB ext3 boot + 2 1024MB 1751GB 1750GB xfs primary + 3 1751GB 2000GB 249GB lvm + + (parted) quit + +#. Next step is to scrub the filesystem and format: + + .. code:: console + + $ sudo dd if=/dev/zero of=/dev/sdb2 bs=$((1024*1024)) count=1 + 1+0 records in + 1+0 records out + 1048576 bytes (1.0 MB) copied, 0.00480617 s, 218 MB/s + $ sudo /sbin/mkfs.xfs -f -i size=1024 /dev/sdb2 + meta-data=/dev/sdb2 isize=1024 agcount=4, agsize=106811524 blks + = sectsz=512 attr=2, projid32bit=0 + data = bsize=4096 blocks=427246093, imaxpct=5 + = sunit=0 swidth=0 blks + naming =version 2 bsize=4096 ascii-ci=0 + log =internal log bsize=4096 blocks=208616, version=2 + = sectsz=512 sunit=0 blks, lazy-count=1 + realtime =none extsz=4096 blocks=0, rtextents=0 + +#. You should now label and mount your filesystem. + +#. Can now check to see if the filesystem is mounted using the command: + + .. code:: console + + $ mount + +.. _checking_if_account_ok: + +Procedure: Checking if an account is okay +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +.. note:: + + ``swift-direct`` is only available in the HPE Helion Public Cloud. + Use ``swiftly`` as an alternate (or use ``swift-get-nodes`` as explained + here). + +You must know the tenant/project ID. You can check if the account is okay as follows from a proxy. + +.. code:: console + + $ sudo -u swift /opt/hp/swift/bin/swift-direct show AUTH_ + +The response will either be similar to a swift list of the account +containers, or an error indicating that the resource could not be found. + +Alternatively, you can use ``swift-get-nodes`` to find the account database +files. Run the following on a proxy: + +.. code:: console + + $ sudo swift-get-nodes /etc/swift/account.ring.gz AUTH_ + +The response will print curl/ssh commands that will list the replicated +account databases. Use the indicated ``curl`` or ``ssh`` commands to check +the status and existence of the account. + +Procedure: Getting swift account stats +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +.. note:: + + ``swift-direct`` is specific to the HPE Helion Public Cloud. Go look at + ``swifty`` for an alternate or use ``swift-get-nodes`` as explained + in :ref:`checking_if_account_ok`. + +This procedure describes how you determine the swift usage for a given +swift account, that is the number of containers, number of objects and +total bytes used. 
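+If ``swift-direct`` is not available in your environment, roughly the
+same totals can be read with the standard ``swift`` client from
+python-swiftclient. This is only a sketch and assumes the account's
+credentials are already exported in the environment; the ``Containers``,
+``Objects`` and ``Bytes`` fields of the output correspond to the values
+discussed below:
+
+.. code:: console
+
+   $ swift stat
+
+The rest of this procedure uses ``swift-direct`` from a proxy node.
+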
To do this you will need the project ID. + +Log onto one of the swift proxy servers. + +Use swift-direct to show this accounts usage: + +.. code:: console + + $ sudo -u swift /opt/hp/swift/bin/swift-direct show AUTH_ + Status: 200 + Content-Length: 0 + Accept-Ranges: bytes + X-Timestamp: 1379698586.88364 + X-Account-Bytes-Used: 67440225625994 + X-Account-Container-Count: 1 + Content-Type: text/plain; charset=utf-8 + X-Account-Object-Count: 8436776 + Status: 200 + name: my_container count: 8436776 bytes: 67440225625994 + +This account has 1 container. That container has 8436776 objects. The +total bytes used is 67440225625994. + +Procedure: Revive a deleted account +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +Swift accounts are normally not recreated. If a tenant/project is deleted, +the account can then be deleted. If the user wishes to use Swift again, +the normal process is to create a new tenant/project -- and hence a +new Swift account. + +However, if the Swift account is deleted, but the tenant/project is not +deleted from Keystone, the user can no longer access the account. This +is because the account is marked deleted in Swift. You can revive +the account as described in this process. + +.. note:: + + The containers and objects in the "old" account cannot be listed + anymore. In addition, if the Account Reaper process has not + finished reaping the containers and objects in the "old" account, these + are effectively orphaned and it is virtually impossible to find and delete + them to free up disk space. + +The solution is to delete the account database files and +re-create the account as follows: + +#. You must know the tenant/project ID. The account name is AUTH_. + In this example, the tenant/project is ``4ebe3039674d4864a11fe0864ae4d905`` + so the Swift account name is ``AUTH_4ebe3039674d4864a11fe0864ae4d905``. + +#. Use ``swift-get-nodes`` to locate the account's database files (on three + servers). The output has been truncated so we can focus on the import pieces + of data: + + .. code:: console + + $ sudo swift-get-nodes /etc/swift/account.ring.gz AUTH_4ebe3039674d4864a11fe0864ae4d905 + ... + curl -I -XHEAD "http://192.168.245.5:6202/disk1/3934/AUTH_4ebe3039674d4864a11fe0864ae4d905" + curl -I -XHEAD "http://192.168.245.3:6202/disk0/3934/AUTH_4ebe3039674d4864a11fe0864ae4d905" + curl -I -XHEAD "http://192.168.245.4:6202/disk1/3934/AUTH_4ebe3039674d4864a11fe0864ae4d905" + ... + Use your own device location of servers: + such as "export DEVICE=/srv/node" + ssh 192.168.245.5 "ls -lah ${DEVICE:-/srv/node*}/disk1/accounts/3934/052/f5ecf8b40de3e1b0adb0dbe576874052" + ssh 192.168.245.3 "ls -lah ${DEVICE:-/srv/node*}/disk0/accounts/3934/052/f5ecf8b40de3e1b0adb0dbe576874052" + ssh 192.168.245.4 "ls -lah ${DEVICE:-/srv/node*}/disk1/accounts/3934/052/f5ecf8b40de3e1b0adb0dbe576874052" + ... + note: `/srv/node*` is used as default value of `devices`, the real value is set in the config file on each storage node. + + +#. Before proceeding check that the account is really deleted by using curl. Execute the + commands printed by ``swift-get-nodes``. For example: + + .. code:: console + + $ curl -I -XHEAD "http://192.168.245.5:6202/disk1/3934/AUTH_4ebe3039674d4864a11fe0864ae4d905" + HTTP/1.1 404 Not Found + Content-Length: 0 + Content-Type: text/html; charset=utf-8 + + Repeat for the other two servers (192.168.245.3 and 192.168.245.4). + A ``404 Not Found`` indicates that the account is deleted (or never existed). + + If you get a ``204 No Content`` response, do **not** proceed. + +#. 
Use the ssh commands printed by ``swift-get-nodes`` to check if database + files exist. For example: + + .. code:: console + + $ ssh 192.168.245.5 "ls -lah ${DEVICE:-/srv/node*}/disk1/accounts/3934/052/f5ecf8b40de3e1b0adb0dbe576874052" + total 20K + drwxr-xr-x 2 swift swift 110 Mar 9 10:22 . + drwxr-xr-x 3 swift swift 45 Mar 9 10:18 .. + -rw------- 1 swift swift 17K Mar 9 10:22 f5ecf8b40de3e1b0adb0dbe576874052.db + -rw-r--r-- 1 swift swift 0 Mar 9 10:22 f5ecf8b40de3e1b0adb0dbe576874052.db.pending + -rwxr-xr-x 1 swift swift 0 Mar 9 10:18 .lock + + Repeat for the other two servers (192.168.245.3 and 192.168.245.4). + + If no files exist, no further action is needed. + +#. Stop Swift processes on all nodes listed by ``swift-get-nodes`` + (In this example, that is 192.168.245.3, 192.168.245.4 and 192.168.245.5). + +#. We recommend you make backup copies of the database files. + +#. Delete the database files. For example: + + .. code:: console + + $ ssh 192.168.245.5 + $ cd /srv/node/disk1/accounts/3934/052/f5ecf8b40de3e1b0adb0dbe576874052 + $ sudo rm * + + Repeat for the other two servers (192.168.245.3 and 192.168.245.4). + +#. Restart Swift on all three servers + +At this stage, the account is fully deleted. If you enable the auto-create option, the +next time the user attempts to access the account, the account will be created. +You may also use swiftly to recreate the account. + + +Procedure: Temporarily stop load balancers from directing traffic to a proxy server +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +You can stop the load balancers sending requests to a proxy server as +follows. This can be useful when a proxy is misbehaving but you need +Swift running to help diagnose the problem. By removing from the load +balancers, customer's are not impacted by the misbehaving proxy. + +#. Ensure that in /etc/swift/proxy-server.conf the ``disable_path`` variable is set to + ``/etc/swift/disabled-by-file``. + +#. Log onto the proxy node. + +#. Shut down Swift as follows: + + .. code:: console + + $ sudo swift-init proxy shutdown + + .. note:: + + Shutdown, not stop. + +#. Create the ``/etc/swift/disabled-by-file`` file. For example: + + .. code:: console + + $ sudo touch /etc/swift/disabled-by-file + +#. Optional, restart Swift: + + .. code:: console + + $ sudo swift-init proxy start + +It works because the healthcheck middleware looks for /etc/swift/disabled-by-file. +If it exists, the middleware will return 503/error instead of 200/OK. This means the load balancer +should stop sending traffic to the proxy. + +Procedure: Ad-Hoc disk performance test +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +You can get an idea whether a disk drive is performing as follows: + +.. code:: console + + $ sudo dd bs=1M count=256 if=/dev/zero conv=fdatasync of=/srv/node/disk11/remember-to-delete-this-later + +You can expect ~600MB/sec. If you get a low number, repeat many times as +Swift itself may also read or write to the disk, hence giving a lower +number. 
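+To spot-check every data disk on a node in one pass, a small loop over
+the ``/srv/node`` mount points can be used. This is only a sketch; the
+``/srv/node/disk*`` layout and the 256MB test size are assumptions
+carried over from the example above, and the test file is removed after
+each run:
+
+.. code:: console
+
+   $ for d in /srv/node/disk*; do
+   >     echo "== $d =="
+   >     sudo dd bs=1M count=256 if=/dev/zero conv=fdatasync of=$d/remember-to-delete-this-later
+   >     sudo rm -f $d/remember-to-delete-this-later
+   > done
+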
diff --git a/doc/source/ops_runbook/troubleshooting.rst b/doc/source/ops_runbook/troubleshooting.rst new file mode 100644 index 0000000000..75511010cd --- /dev/null +++ b/doc/source/ops_runbook/troubleshooting.rst @@ -0,0 +1,259 @@ +==================== +Troubleshooting tips +==================== + +Diagnose: Customer complains they receive a HTTP status 500 when trying to browse containers +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +This entry is prompted by a real customer issue and exclusively focused on how +that problem was identified. +There are many reasons why a http status of 500 could be returned. If +there are no obvious problems with the swift object store, then it may +be necessary to take a closer look at the users transactions. +After finding the users swift account, you can +search the swift proxy logs on each swift proxy server for +transactions from this user. The linux ``bzgrep`` command can be used to +search all the proxy log files on a node including the ``.bz2`` compressed +files. For example: + +.. code:: console + + $ PDSH_SSH_ARGS_APPEND="-o StrictHostKeyChecking=no" pdsh -l -R ssh \ + -w .68.[4-11,132-139 4-11,132-139],.132.[4-11,132-139] \ + 'sudo bzgrep -w AUTH_redacted-4962-4692-98fb-52ddda82a5af /var/log/swift/proxy.log*' | dshbak -c + . + . + ---------------- + .132.6 + ---------------- + Feb 29 08:51:57 sw-aw2az2-proxy011 proxy-server .16.132 + .66.8 29/Feb/2012/08/51/57 GET /v1.0/AUTH_redacted-4962-4692-98fb-52ddda82a5af + /%3Fformat%3Djson HTTP/1.0 404 - - _4f4d50c5e4b064d88bd7ab82 - - - + tx429fc3be354f434ab7f9c6c4206c1dc3 - 0.0130 + +This shows a ``GET`` operation on the users account. + +.. note:: + + The HTTP status returned is 404, Not found, rather than 500 as reported by the user. + +Using the transaction ID, ``tx429fc3be354f434ab7f9c6c4206c1dc3`` you can +search the swift object servers log files for this transaction ID: + +.. code:: console + + $ PDSH_SSH_ARGS_APPEND="-o StrictHostKeyChecking=no" pdsh -l -R ssh \ + -w .72.[4-67|4-67],.[4-67|4-67],.[4-67|4-67],.204.[4-131] \ + 'sudo bzgrep tx429fc3be354f434ab7f9c6c4206c1dc3 /var/log/swift/server.log*' | dshbak -c + . + . + ---------------- + .72.16 + ---------------- + Feb 29 08:51:57 sw-aw2az1-object013 account-server .132.6 - - + + [29/Feb/2012:08:51:57 +0000|] "GET /disk9/198875/AUTH_redacted-4962-4692-98fb-52ddda82a5af" + 404 - "tx429fc3be354f434ab7f9c6c4206c1dc3" "-" "-" + + 0.0016 "" + ---------------- + .31 + ---------------- + Feb 29 08:51:57 node-az2-object060 account-server .132.6 - - + [29/Feb/2012:08:51:57 +0000|] "GET /disk6/198875/AUTH_redacted-4962- + 4692-98fb-52ddda82a5af" 404 - "tx429fc3be354f434ab7f9c6c4206c1dc3" "-" "-" 0.0011 "" + ---------------- + .204.70 + ---------------- + + Feb 29 08:51:57 sw-aw2az3-object0067 account-server .132.6 - - + [29/Feb/2012:08:51:57 +0000|] "GET /disk6/198875/AUTH_redacted-4962- + 4692-98fb-52ddda82a5af" 404 - "tx429fc3be354f434ab7f9c6c4206c1dc3" "-" "-" 0.0014 "" + +.. note:: + + The 3 GET operations to 3 different object servers that hold the 3 + replicas of this users account. Each ``GET`` returns a HTTP status of 404, + Not found. + +Next, use the ``swift-get-nodes`` command to determine exactly where the +user's account data is stored: + +.. 
code:: console + + $ sudo swift-get-nodes /etc/swift/account.ring.gz AUTH_redacted-4962-4692-98fb-52ddda82a5af + Account AUTH_redacted-4962-4692-98fb-52ddda82a5af + Container None + Object None + + Partition 198875 + Hash 1846d99185f8a0edaf65cfbf37439696 + + Server:Port Device .31:6202 disk6 + Server:Port Device .204.70:6202 disk6 + Server:Port Device .72.16:6202 disk9 + Server:Port Device .204.64:6202 disk11 [Handoff] + Server:Port Device .26:6202 disk11 [Handoff] + Server:Port Device .72.27:6202 disk11 [Handoff] + + curl -I -XHEAD "`http://.31:6202/disk6/198875/AUTH_redacted-4962-4692-98fb-52ddda82a5af" + `_ + curl -I -XHEAD "`http://.204.70:6202/disk6/198875/AUTH_redacted-4962-4692-98fb-52ddda82a5af" + `_ + curl -I -XHEAD "`http://.72.16:6202/disk9/198875/AUTH_redacted-4962-4692-98fb-52ddda82a5af" + `_ + curl -I -XHEAD "`http://.204.64:6202/disk11/198875/AUTH_redacted-4962-4692-98fb-52ddda82a5af" + `_ # [Handoff] + curl -I -XHEAD "`http://.26:6202/disk11/198875/AUTH_redacted-4962-4692-98fb-52ddda82a5af" + `_ # [Handoff] + curl -I -XHEAD "`http://.72.27:6202/disk11/198875/AUTH_redacted-4962-4692-98fb-52ddda82a5af" + `_ # [Handoff] + + ssh .31 "ls -lah /srv/node/disk6/accounts/198875/696/1846d99185f8a0edaf65cfbf37439696/" + ssh .204.70 "ls -lah /srv/node/disk6/accounts/198875/696/1846d99185f8a0edaf65cfbf37439696/" + ssh .72.16 "ls -lah /srv/node/disk9/accounts/198875/696/1846d99185f8a0edaf65cfbf37439696/" + ssh .204.64 "ls -lah /srv/node/disk11/accounts/198875/696/1846d99185f8a0edaf65cfbf37439696/" # [Handoff] + ssh .26 "ls -lah /srv/node/disk11/accounts/198875/696/1846d99185f8a0edaf65cfbf37439696/" # [Handoff] + ssh .72.27 "ls -lah /srv/node/disk11/accounts/198875/696/1846d99185f8a0edaf65cfbf37439696/" # [Handoff] + +Check each of the primary servers, .31, .204.70 and .72.16, for +this users account. For example on .72.16: + +.. code:: console + + $ ls -lah /srv/node/disk9/accounts/198875/696/1846d99185f8a0edaf65cfbf37439696/ + total 1.0M + drwxrwxrwx 2 swift swift 98 2012-02-23 14:49 . + drwxrwxrwx 3 swift swift 45 2012-02-03 23:28 .. + -rw------- 1 swift swift 15K 2012-02-23 14:49 1846d99185f8a0edaf65cfbf37439696.db + -rw-rw-rw- 1 swift swift 0 2012-02-23 14:49 1846d99185f8a0edaf65cfbf37439696.db.pending + +So this users account db, an sqlite db is present. Use sqlite to +checkout the account: + +.. code:: console + + $ sudo cp /srv/node/disk9/accounts/198875/696/1846d99185f8a0edaf65cfbf37439696/1846d99185f8a0edaf65cfbf37439696.db /tmp + $ sudo sqlite3 /tmp/1846d99185f8a0edaf65cfbf37439696.db + sqlite> .mode line + sqlite> select * from account_stat; + account = AUTH_redacted-4962-4692-98fb-52ddda82a5af + created_at = 1328311738.42190 + put_timestamp = 1330000873.61411 + delete_timestamp = 1330001026.00514 + container_count = 0 + object_count = 0 + bytes_used = 0 + hash = eb7e5d0ea3544d9def940b19114e8b43 + id = 2de8c8a8-cef9-4a94-a421-2f845802fe90 + status = DELETED + status_changed_at = 1330001026.00514 + metadata = + +.. note: + + The status is ``DELETED``. So this account was deleted. This explains + why the GET operations are returning 404, not found. Check the account + delete date/time: + + .. code:: console + + $ python + + >>> import time + >>> time.ctime(1330001026.00514) + 'Thu Feb 23 12:43:46 2012' + +Next try and find the ``DELETE`` operation for this account in the proxy +server logs: + +.. 
code:: console + + $ PDSH_SSH_ARGS_APPEND="-o StrictHostKeyChecking=no" pdsh -l -R ssh \ + -w .68.[4-11,132-139 4-11,132-139],.132.[4-11,132-139|4-11,132-139] \ + 'sudo bzgrep AUTH_redacted-4962-4692-98fb-52ddda82a5af /var/log/swift/proxy.log* \ + | grep -w DELETE | awk "{print $3,$10,$12}"' |- dshbak -c + . + . + Feb 23 12:43:46 sw-aw2az2-proxy001 proxy-server .66.7 23/Feb/2012/12/43/46 DELETE /v1.0/AUTH_redacted-4962-4692-98fb- + 52ddda82a5af/ HTTP/1.0 204 - Apache-HttpClient/4.1.2%20%28java%201.5%29 _4f458ee4e4b02a869c3aad02 - - - + tx4471188b0b87406899973d297c55ab53 - 0.0086 + +From this you can see the operation that resulted in the account being deleted. + +Procedure: Deleting objects +~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +Simple case - deleting small number of objects and containers +------------------------------------------------------------- + +.. note:: + + ``swift-direct`` is specific to the Hewlett Packard Enterprise Helion Public Cloud. + Use ``swiftly`` as an alternative. + +.. note:: + + Object and container names are in UTF8. Swift direct accepts UTF8 + directly, not URL-encoded UTF8 (the REST API expects UTF8 and then + URL-encoded). In practice cut and paste of foreign language strings to + a terminal window will produce the right result. + + Hint: Use the ``head`` command before any destructive commands. + +To delete a small number of objects, log into any proxy node and proceed +as follows: + +Examine the object in question: + +.. code:: console + + $ sudo -u swift /opt/hp/swift/bin/swift-direct head 132345678912345 container_name obj_name + +See if ``X-Object-Manifest`` or ``X-Static-Large-Object`` is set, +then this is the manifest object and segment objects may be in another +container. + +If the ``X-Object-Manifest`` attribute is set, you need to find the +name of the objects this means it is a DLO. For example, +if ``X-Object-Manifest`` is ``container2/seg-blah``, list the contents +of the container container2 as follows: + +.. code:: console + + $ sudo -u swift /opt/hp/swift/bin/swift-direct show 132345678912345 container2 + +Pick out the objects whose names start with ``seg-blah``. +Delete the segment objects as follows: + +.. code:: console + + $ sudo -u swift /opt/hp/swift/bin/swift-direct delete 132345678912345 container2 seg-blah01 + $ sudo -u swift /opt/hp/swift/bin/swift-direct delete 132345678912345 container2 seg-blah02 + etc + +If ``X-Static-Large-Object`` is set, you need to read the contents. Do this by: + +- Using swift-get-nodes to get the details of the object's location. +- Change the ``-X HEAD`` to ``-X GET`` and run ``curl`` against one copy. +- This lists a JSON body listing containers and object names +- Delete the objects as described above for DLO segments + +Once the segments are deleted, you can delete the object using +``swift-direct`` as described above. + +Finally, use ``swift-direct`` to delete the container. + +Procedure: Decommissioning swift nodes +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +Should Swift nodes need to be decommissioned (e.g.,, where they are being +re-purposed), it is very important to follow the following steps. + +#. In the case of object servers, follow the procedure for removing + the node from the rings. +#. In the case of swift proxy servers, have the network team remove + the node from the load balancers. +#. Open a network ticket to have the node removed from network + firewalls. +#. Make sure that you remove the ``/etc/swift`` directory and everything in it. 
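+
+Example: Listing the segments of a static large object
+~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
+
+This supplements the static large object steps in
+``Procedure: Deleting objects`` above. The manifest retrieved with the
+``-X GET`` form of the ``curl`` command is a JSON list of segment entries.
+The sketch below assumes that response body has been saved to a file named
+``manifest.json`` (the filename is arbitrary); it prints the container and
+object name of each segment so they can then be deleted with
+``swift-direct`` as described earlier:
+
+.. code:: python
+
+   import json
+
+   # Saved body of the "curl ... -X GET" request against one replica of the
+   # SLO manifest object.
+   with open('manifest.json') as f:
+       segments = json.load(f)
+
+   # Each entry's "name" field holds "/<container>/<object>".
+   for seg in segments:
+       container, obj = seg['name'].lstrip('/').split('/', 1)
+       print(container, obj)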
diff --git a/doc/source/overview_acl.rst b/doc/source/overview_acl.rst new file mode 100644 index 0000000000..d4c1ca09e2 --- /dev/null +++ b/doc/source/overview_acl.rst @@ -0,0 +1,410 @@ + +=========================== +Access Control Lists (ACLs) +=========================== + +Normally to create, read and modify containers and objects, you must have the +appropriate roles on the project associated with the account, i.e., you +must be the owner of the account. However, an owner can grant access to +other users by using an Access Control List (ACL). + +There are two types of ACLs: + +- :ref:`container_acls`. These are specified on a container and + apply to that container only and the objects in the container. +- :ref:`account_acls`. These are specified at the account level and + apply to all containers and objects in the account. + +.. _container_acls: + +-------------- +Container ACLs +-------------- + +Container ACLs are stored in the ``X-Container-Write`` and ``X-Container-Read`` +metadata. The scope of the ACL is limited to the container where the +metadata is set and the objects in the container. In addition: + +- ``X-Container-Write`` grants the ability to perform PUT, POST and DELETE + operations on objects within a container. It does not grant the ability + to perform POST or DELETE operations on the container itself. Some ACL + elements also grant the ability to perform HEAD or GET operations on the + container. + +- ``X-Container-Read`` grants the ability to perform GET and HEAD + operations on objects within a container. Some of the ACL elements also grant + the ability to perform HEAD or GET operations on the container itself. + However, a container ACL does not allow access to privileged metadata (such + as ``X-Container-Sync-Key``). + +Container ACLs use the "V1" ACL syntax which is a comma separated string +of elements as shown in the following example:: + + .r:*,.rlistings,7ec59e87c6584c348b563254aae4c221:* + +Spaces may occur between elements as shown in the following example:: + + + .r : *, .rlistings, 7ec59e87c6584c348b563254aae4c221:* + +However, these spaces are removed from the value stored in the +``X-Container-Write`` and ``X-Container-Read`` metadata. In addition, +the ``.r:`` string can be written as ``.referrer:``, but is stored as ``.r:``. + +While all auth systems use +the same syntax, the meaning of some elements +is different because of the different concepts used by different +auth systems as explained in the following sections: + +- :ref:`acl_common_elements` +- :ref:`acl_keystone_elements` +- :ref:`acl_tempauth_elements` + + +.. _acl_common_elements: + +Common ACL Elements +------------------- + +The following table describes elements of an ACL that are +supported by both Keystone auth and TempAuth. These elements +should only be used with ``X-Container-Read`` (with the exception +of ``.rlistings``, an error will occur if used with +``X-Container-Write``): + +============================== ================================================ +Element Description +============================== ================================================ +.r:* Any user has access to objects. No token is + required in the request. +.r: The referrer is granted access to objects. The + referrer is identified by the ``Referer`` + request header in the request. No token is + required. +.r:- This syntax (with "-" prepended to the + referrer) is supported. However, it does not + deny access if another element (e.g., ``.r:*``) + grants access. 
+.rlistings Any user can perform a HEAD or GET operation + on the container provided the user also has + read access on objects (e.g., also has ``.r:*`` + or ``.r:``. No token is required. +============================== ================================================ + +.. _acl_keystone_elements: + +Keystone Auth ACL Elements +-------------------------- + +The following table describes elements of an ACL that are +supported only by Keystone auth. Keystone auth also supports +the elements described in :ref:`acl_common_elements`. + +A token must be included in the request for any of these ACL elements +to take effect. + +============================== ================================================ +Element Description +============================== ================================================ +: The specified user, provided a token + scoped to the project is included + in the request, is granted access. + Access to the container is also granted + when used in ``X-Container-Read``. +:\* Any user with a role in the specified Keystone + project has access. A token scoped to the + project must be included in the request. + Access to the container is also granted + when used in ``X-Container-Read``. +\*: The specified user has access. A token + for the user (scoped to any + project) must be included in the request. + Access to the container is also granted + when used in ``X-Container-Read``. +\*:\* Any user has access. + Access to the container is also granted + when used in ``X-Container-Read``. + The ``*:*`` element differs from the ``.r:*`` + element because + ``*:*`` requires that a valid token is + included in the request whereas ``.r:*`` + does not require a token. In addition, + ``.r:*`` does not grant access to the + container listing. + A user with the specified role *name* on the + project within which the container is stored is + granted access. A user token scoped to the + project must be included in the request. Access + to the container is also granted when used in + ``X-Container-Read``. +============================== ================================================ + +.. note:: + + Keystone project (tenant) or user *names* (i.e., + ``:``) must no longer be + used because with the introduction + of domains in Keystone, names are not globally unique. You should + use user and project *ids* instead. + + For backwards compatibility, ACLs using names will be granted by + keystoneauth when it can be established that + the grantee project, the grantee user and the project being + accessed are either not yet in a domain (e.g. the ``X-Auth-Token`` has + been obtained via the Keystone V2 API) or are all in the default domain + to which legacy accounts would have been migrated. + + +.. _acl_tempauth_elements: + +TempAuth ACL Elements +--------------------- + +The following table describes elements of an ACL that are +supported only by TempAuth. TempAuth auth also supports +the elements described in :ref:`acl_common_elements`. + +============================== ================================================ +Element Description +============================== ================================================ + The named user is granted access. The + wildcard ("*") character is not supported. + A token from the user must be included in the + request. 
+============================== ================================================ + +---------------------- +Container ACL Examples +---------------------- + +Container ACLs may be set by including ``X-Container-Write`` and/or +``X-Container-Read`` headers with a PUT or a POST request to the container URL. +The following examples use the ``swift`` command line client which support +these headers being set via its ``--write-acl`` and ``--read-acl`` options. + +Example: Public Container +------------------------- + +The following allows anybody to list objects in the ``www`` container and +download objects. The users do not need to include a token in +their request. This ACL is commonly referred to as making the +container "public". It is useful when used with :ref:`staticweb`:: + + swift post www --read-acl ".r:*,.rlistings" + + +Example: Shared Writable Container +---------------------------------- + +The following allows anybody to upload or download objects. However, to +download an object, the exact name of the object must be known since +users cannot list the objects in the container. +The users must include a Keystone token in the upload request. However, it does not +need to be scoped to the project associated with the container:: + + swift post www --read-acl ".r:*" --write-acl "*:*" + + +Example: Sharing a Container with Project Members +------------------------------------------------- + +The following allows any member of the ``77b8f82565f14814bece56e50c4c240f`` +project to upload and download objects or to list the contents +of the ``www`` container. A token scoped to the ``77b8f82565f14814bece56e50c4c240f`` +project must be included in the request:: + + swift post www --read-acl "77b8f82565f14814bece56e50c4c240f:*" \ + --write-acl "77b8f82565f14814bece56e50c4c240f:*" + + +Example: Sharing a Container with Users having a specified Role +--------------------------------------------------------------- + +The following allows any user that has been assigned the +``my_read_access_role`` on the project within which the ``www`` container is +stored to download objects or to list the contents of the ``www`` container. A +user token scoped to the project must be included in the download or list +request:: + + swift post www --read-acl "my_read_access_role" + + +Example: Allowing a Referrer Domain to Download Objects +------------------------------------------------------- + +The following allows any request from +the ``example.com`` domain to access an object in the container:: + + swift post www --read-acl ".r:.example.com" + +However, the request from the user **must** contain the appropriate +`Referer` header as shown in this example request:: + + curl -i $publicURL/www/document --head -H "Referer: http://www.example.com/index.html" + +.. note:: + + The `Referer` header is included in requests by many browsers. However, + since it is easy to create a request with any desired value in the + `Referer` header, the referrer ACL has very weak security. + + +Example: Sharing a Container with Another User +---------------------------------------------- + +Sharing a Container with another user requires the knowledge of few +parameters regarding the users. 
+ +The sharing user must know: + +- the ``OpenStack user id`` of the other user + +The sharing user must communicate to the other user: + +- the name of the shared container +- the ``OS_STORAGE_URL`` + +Usually the ``OS_STORAGE_URL`` is not exposed directly to the user +because the ``swift client`` by default automatically construct the +``OS_STORAGE_URL`` based on the User credential. + +We assume that in the current directory there are the two client +environment script for the two users ``sharing.openrc`` and +``other.openrc``. + +The ``sharing.openrc`` should be similar to the following: + +.. code-block:: bash + + export OS_USERNAME=sharing + # WARNING: Save the password in clear text only for testing purposes + export OS_PASSWORD=password + export OS_TENANT_NAME=projectName + export OS_AUTH_URL=https://identityHost:portNumber/v2.0 + # The following lines can be omitted + export OS_TENANT_ID=tenantIDString + export OS_REGION_NAME=regionName + export OS_CACERT=/path/to/cacertFile + +The ``other.openrc`` should be similar to the following: + +.. code-block:: bash + + export OS_USERNAME=other + # WARNING: Save the password in clear text only for testing purposes + export OS_PASSWORD=otherPassword + export OS_TENANT_NAME=otherProjectName + export OS_AUTH_URL=https://identityHost:portNumber/v2.0 + # The following lines can be omitted + export OS_TENANT_ID=tenantIDString + export OS_REGION_NAME=regionName + export OS_CACERT=/path/to/cacertFile + +For more information see `using the OpenStack RC file +`_ + +First we figure out the other user id:: + + . other.openrc + OUID="$(openstack user show --format json "${OS_USERNAME}" | jq -r .id)" + +or alternatively:: + + . other.openrc + OUID="$(openstack token issue -f json | jq -r .user_id)" + +Then we figure out the storage url of the sharing user:: + + sharing.openrc + SURL="$(swift auth | awk -F = '/OS_STORAGE_URL/ {print $2}')" + +Running as the sharing user create a shared container named ``shared`` +in read-only mode with the other user using the proper acl:: + + sharing.openrc + swift post --read-acl "*:${OUID}" shared + +Running as the sharing user create and upload a test file:: + + touch void + swift upload shared void + +Running as the other user list the files in the ``shared`` container:: + + other.openrc + swift --os-storage-url="${SURL}" list shared + +Running as the other user download the ``shared`` container in the +``/tmp`` directory:: + + cd /tmp + swift --os-storage-url="${SURL}" download shared + + +.. _account_acls: + +------------ +Account ACLs +------------ + +.. note:: + + Account ACLs are not currently supported by Keystone auth + +The ``X-Account-Access-Control`` header is used to specify +account-level ACLs in a format specific to the auth system. +These headers are visible and settable only by account owners (those for whom +``swift_owner`` is true). +Behavior of account ACLs is auth-system-dependent. In the case of TempAuth, +if an authenticated user has membership in a group which is listed in the +ACL, then the user is allowed the access level of that ACL. + +Account ACLs use the "V2" ACL syntax, which is a JSON dictionary with keys +named "admin", "read-write", and "read-only". (Note the case sensitivity.) +An example value for the ``X-Account-Access-Control`` header looks like this, +where ``a``, ``b`` and ``c`` are user names:: + + {"admin":["a","b"],"read-only":["c"]} + +Keys may be absent (as shown in above example). 
+ +The recommended way to generate ACL strings is as follows:: + + from swift.common.middleware.acl import format_acl + acl_data = { 'admin': ['alice'], 'read-write': ['bob', 'carol'] } + acl_string = format_acl(version=2, acl_dict=acl_data) + +Using the :func:`format_acl` method will ensure +that JSON is encoded as ASCII (using e.g. '\u1234' for Unicode). While +it's permissible to manually send ``curl`` commands containing +``X-Account-Access-Control`` headers, you should exercise caution when +doing so, due to the potential for human error. + +Within the JSON dictionary stored in ``X-Account-Access-Control``, the keys +have the following meanings: + +============ ============================================================== +Access Level Description +============ ============================================================== +read-only These identities can read *everything* (except privileged + headers) in the account. Specifically, a user with read-only + account access can get a list of containers in the account, + list the contents of any container, retrieve any object, and + see the (non-privileged) headers of the account, any + container, or any object. +read-write These identities can read or write (or create) any container. + A user with read-write account access can create new + containers, set any unprivileged container headers, overwrite + objects, delete containers, etc. A read-write user can NOT + set account headers (or perform any PUT/POST/DELETE requests + on the account). +admin These identities have "swift_owner" privileges. A user with + admin account access can do anything the account owner can, + including setting account headers and any privileged headers + -- and thus granting read-only, read-write, or admin access + to other users. +============ ============================================================== + + +For more details, see :mod:`swift.common.middleware.tempauth`. For details +on the ACL format, see :mod:`swift.common.middleware.acl`. diff --git a/doc/source/overview_architecture.rst b/doc/source/overview_architecture.rst index 7cd56a8c7c..b0ae293d9a 100644 --- a/doc/source/overview_architecture.rst +++ b/doc/source/overview_architecture.rst @@ -2,8 +2,6 @@ Swift Architectural Overview ============================ -.. TODO - add links to more detailed overview in each section below. - ------------ Proxy Server ------------ @@ -11,7 +9,10 @@ Proxy Server The Proxy Server is responsible for tying together the rest of the Swift architecture. For each request, it will look up the location of the account, container, or object in the ring (see below) and route the request accordingly. -The public API is also exposed through the Proxy Server. +For Erasure Code type policies, the Proxy Server is also responsible for +encoding and decoding object data. See :doc:`overview_erasure_code` for +complete information on Erasure Code support. The public API is also exposed +through the Proxy Server. A large number of failures are also handled in the Proxy Server. For example, if a server is unavailable for an object PUT, it will ask the @@ -27,9 +28,9 @@ The Ring A ring represents a mapping between the names of entities stored on disk and their physical location. There are separate rings for accounts, containers, and -objects. When other components need to perform any operation on an object, -container, or account, they need to interact with the appropriate ring to -determine its location in the cluster. +one object ring per storage policy. 
When other components need to perform any +operation on an object, container, or account, they need to interact with the +appropriate ring to determine its location in the cluster. The Ring maintains this mapping using zones, devices, partitions, and replicas. Each partition in the ring is replicated, by default, 3 times across the @@ -37,22 +38,71 @@ cluster, and the locations for a partition are stored in the mapping maintained by the ring. The ring is also responsible for determining which devices are used for handoff in failure scenarios. -Data can be isolated with the concept of zones in the ring. Each replica -of a partition is guaranteed to reside in a different zone. A zone could -represent a drive, a server, a cabinet, a switch, or even a datacenter. +The replicas of each partition will be isolated onto as many distinct regions, +zones, servers and devices as the capacity of these failure domains allow. If +there are less failure domains at a given tier than replicas of the partition +assigned within a tier (e.g. a 3 replica cluster with 2 servers), or the +available capacity across the failure domains within a tier are not well +balanced it will not be possible to achieve both even capacity distribution +(`balance`) as well as complete isolation of replicas across failure domains +(`dispersion`). When this occurs the ring management tools will display a +warning so that the operator can evaluate the cluster topology. + +Data is evenly distributed across the capacity available in the cluster as +described by the devices weight. Weights can be used to balance the +distribution of partitions on drives across the cluster. This can be useful, +for example, when different sized drives are used in a cluster. Device +weights can also be used when adding or removing capacity or failure domains +to control how many partitions are reassigned during a rebalance to be moved +as soon as replication bandwidth allows. + +.. note:: + Prior to Swift 2.1.0 it was not possible to restrict partition movement by + device weight when adding new failure domains, and would allow extremely + unbalanced rings. The greedy dispersion algorithm is now subject to the + constraints of the physical capacity in the system, but can be adjusted + with-in reason via the overload option. Artificially unbalancing the + partition assignment without respect to capacity can introduce unexpected + full devices when a given failure domain does not physically support its + share of the used capacity in the tier. + +When partitions need to be moved around (for example if a device is added to +the cluster), the ring ensures that a minimum number of partitions are moved +at a time, and only one replica of a partition is moved at a time. + +The ring is used by the Proxy server and several background processes +(like replication). See :doc:`overview_ring` for complete information on the +ring. + +---------------- +Storage Policies +---------------- -The partitions of the ring are equally divided among all the devices in the -Swift installation. When partitions need to be moved around (for example if a -device is added to the cluster), the ring ensures that a minimum number of -partitions are moved at a time, and only one replica of a partition is moved at -a time. +Storage Policies provide a way for object storage providers to differentiate +service levels, features and behaviors of a Swift deployment. Each Storage +Policy configured in Swift is exposed to the client via an abstract name. 
+Each device in the system is assigned to one or more Storage Policies. This +is accomplished through the use of multiple object rings, where each Storage +Policy has an independent object ring, which may include a subset of hardware +implementing a particular differentiation. -Weights can be used to balance the distribution of partitions on drives -across the cluster. This can be useful, for example, when different sized -drives are used in a cluster. +For example, one might have the default policy with 3x replication, and create +a second policy which, when applied to new containers only uses 2x replication. +Another might add SSDs to a set of storage nodes and create a performance tier +storage policy for certain containers to have their objects stored there. Yet +another might be the use of Erasure Coding to define a cold-storage tier. -The ring is used by the Proxy server and several background processes -(like replication). +This mapping is then exposed on a per-container basis, where each container +can be assigned a specific storage policy when it is created, which remains in +effect for the lifetime of the container. Applications require minimal +awareness of storage policies to use them; once a container has been created +with a specific policy, all objects stored in it will be done so in accordance +with that policy. + +The Storage Policies feature is implemented throughout the entire code base so +it is an important concept in understanding Swift architecture. + +See :doc:`overview_policies` for complete information on storage policies. ------------- Object Server @@ -111,6 +161,19 @@ item (object, container, or account) is deleted, a tombstone is set as the latest version of the item. The replicator will see the tombstone and ensure that the item is removed from the entire system. +See :doc:`overview_replication` for complete information on replication. + +-------------- +Reconstruction +-------------- + +The reconstructor is used by Erasure Code policies and is analogous to the +replicator for Replication type policies. See :doc:`overview_erasure_code` +for complete information on both Erasure Code support as well as the +reconstructor. + +.. _architecture_updaters: + -------- Updaters -------- @@ -141,5 +204,4 @@ containers, and accounts. If corruption is found (in the case of bit rot, for example), the file is quarantined, and replication will replace the bad file from another replica. If other errors are found they are logged (for example, an object's listing can't be found on any container server it -should be). - +should be). \ No newline at end of file diff --git a/doc/source/overview_auth.rst b/doc/source/overview_auth.rst index ee0f3fb85d..d5b1be6324 100644 --- a/doc/source/overview_auth.rst +++ b/doc/source/overview_auth.rst @@ -3,12 +3,11 @@ The Auth System =============== -------- -TempAuth +Overview -------- -The auth system for Swift is loosely based on the auth system from the existing -Rackspace architecture -- actually from a few existing auth systems -- and is -therefore a bit disjointed. The distilled points about it are: +Swift supports a number of auth systems that share the following common +characteristics: * The authentication/authorization part can be an external system or a subsystem run within Swift as WSGI middleware @@ -26,51 +25,101 @@ validation. Swift will make calls to the auth system, giving the auth token to be validated. For a valid token, the auth system responds with an overall -expiration in seconds from now. 
Swift will cache the token up to the expiration +expiration time in seconds from now. To avoid the overhead in validating the same +token over and over again, Swift will cache the +token for a configurable time, but no longer than the expiration time. -The included TempAuth also has the concept of admin and non-admin users within -an account. Admin users can do anything within the account. Non-admin users can -only perform operations per container based on the container's X-Container-Read -and X-Container-Write ACLs. For more information on ACLs, see -:mod:`swift.common.middleware.acl`. +The Swift project includes two auth systems: + +- :ref:`temp_auth` +- :ref:`keystone_auth` + +It is also possible to write your own auth system as described in +:ref:`extending_auth`. + +.. _temp_auth: + +-------- +TempAuth +-------- -Additionally, if the auth system sets the request environ's swift_owner key to -True, the proxy will return additional header information in some requests, -such as the X-Container-Sync-Key for a container GET or HEAD. +TempAuth is used primarily in Swift's functional test environment and can be +used in other test environments (such as :doc:`development_saio`). It is not +recommended to use TempAuth in a production system. However, TempAuth is fully +functional and can be used as a model to develop your own auth system. + +TempAuth has the concept of admin and non-admin users +within an account. Admin users can do anything within the account. +Non-admin users can only perform read operations. However, some +privileged metadata such as X-Container-Sync-Key is not accessible to +non-admin users. + +Users with the special group ``.reseller_admin`` can operate on any account. +For an example usage please see :mod:`swift.common.middleware.tempauth`. +If a request is coming from a reseller the auth system sets the request environ +reseller_request to True. This can be used by other middlewares. + +Other users may be granted the ability to perform operations on +an account or container via ACLs. TempAuth supports two types of ACL: + +- Per container ACLs based on the + container's ``X-Container-Read`` and ``X-Container-Write`` metadata. See + :ref:`container_acls` for more information. + +- Per account ACLs based on the account's ``X-Account-Access-Control`` + metadata. For more information see :ref:`account_acls`. TempAuth will now allow OPTIONS requests to go through without a token. -The user starts a session by sending a ReST request to the auth system to -receive the auth token and a URL to the Swift system. +The TempAuth middleware is responsible for creating its own tokens. A user +makes a request containing their username and password and TempAuth +responds with a token. This token is then used to perform subsequent +requests on the user's account, containers and objects. + +.. _keystone_auth: ------------- Keystone Auth ------------- -Swift is able to authenticate against OpenStack keystone via the -:mod:`swift.common.middleware.keystoneauth` middleware. +Swift is able to authenticate against OpenStack Keystone_. In this +environment, Keystone is responsible for creating and validating +tokens. The :ref:`keystoneauth` middleware is responsible for +implementing the auth system within Swift as described here. + +The :ref:`keystoneauth` middleware supports per container based ACLs on the +container's ``X-Container-Read`` and ``X-Container-Write`` metadata. +For more information see :ref:`container_acls`. 
-In order to use the ``keystoneauth`` middleware the ``authtoken`` -middleware from python-keystoneclient will need to be configured. +The account-level ACL is not supported by Keystone auth. + +In order to use the ``keystoneauth`` middleware the ``auth_token`` +middleware from KeystoneMiddleware_ will need to be configured. The ``authtoken`` middleware performs the authentication token validation and retrieves actual user authentication information. It -can be found in the python-keystoneclient distribution. +can be found in the KeystoneMiddleware_ distribution. + +The :ref:`keystoneauth` middleware performs authorization and mapping the +Keystone roles to Swift's ACLs. -The ``keystoneauth`` middleware performs authorization and mapping the -``keystone`` roles to Swift's ACLs. +.. _KeystoneMiddleware: https://docs.openstack.org/keystonemiddleware/latest/ +.. _Keystone: https://docs.openstack.org/keystone/latest/ + +.. _configuring_keystone_auth: Configuring Swift to use Keystone ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -Configuring Swift to use Keystone is relatively straight -forward. The first step is to ensure that you have the auth_token -middleware installed, distributed with keystone it can either be -dropped in your python path or installed via the keystone package. +Configuring Swift to use Keystone_ +is relatively straightforward. The first +step is to ensure that you have the ``auth_token`` middleware installed. It can +either be dropped in your python path or installed via the KeystoneMiddleware_ +package. You need at first make sure you have a service endpoint of type -``object-store`` in keystone pointing to your Swift proxy. For example +``object-store`` in Keystone pointing to your Swift proxy. For example having this in your ``/etc/keystone/default_catalog.templates`` :: catalog.RegionOne.object_store.name = Swift Service @@ -78,7 +127,7 @@ having this in your ``/etc/keystone/default_catalog.templates`` :: catalog.RegionOne.object_store.adminURL = http://swiftproxy:8080/ catalog.RegionOne.object_store.internalURL = http://swiftproxy:8080/v1/AUTH_$(tenant_id)s -On your Swift Proxy server you will want to adjust your main pipeline +On your Swift proxy server you will want to adjust your main pipeline and add auth_token and keystoneauth in your ``/etc/swift/proxy-server.conf`` like this :: @@ -88,46 +137,234 @@ and add auth_token and keystoneauth in your add the configuration for the authtoken middleware:: [filter:authtoken] - paste.filter_factory = keystoneclient.middleware.auth_token:filter_factory - auth_host = keystonehost - auth_port = 35357 - auth_protocol = http - auth_uri = http://keystonehost:5000/ - admin_tenant_name = service - admin_user = swift - admin_password = password + paste.filter_factory = keystonemiddleware.auth_token:filter_factory + www_authenticate_uri = http://keystonehost:5000/ + auth_url = http://keystonehost:5000/ + auth_plugin = password + project_domain_id = default + user_domain_id = default + project_name = service + username = swift + password = password + cache = swift.cache + include_service_catalog = False + delay_auth_decision = True The actual values for these variables will need to be set depending on -your situation. For more information, please refer to the Keystone -documentation on the ``auth_token`` middleware, but in short: +your situation, but in short: + +* ``www_authenticate_uri`` should point to a Keystone service from which users may + retrieve tokens. 
This value is used in the `WWW-Authenticate` header that + auth_token sends with any denial response. +* ``auth_url`` points to the Keystone Admin service. This information is + used by the middleware to actually query Keystone about the validity of the + authentication tokens. It is not necessary to append any Keystone API version + number to this URI. +* The auth credentials (``project_domain_id``, ``user_domain_id``, + ``username``, ``project_name``, ``password``) will be used to retrieve an + admin token. That token will be used to authorize user tokens behind the + scenes. These credentials must match the Keystone credentials for the Swift + service. The example values shown here assume a user named 'swift' with admin + role on a project named 'service', both being in the Keystone domain with id + 'default'. Refer to the `KeystoneMiddleware documentation + `_ + for other examples. + +* ``cache`` is set to ``swift.cache``. This means that the middleware + will get the Swift memcache from the request environment. +* ``include_service_catalog`` defaults to ``True`` if not set. This means + that when validating a token, the service catalog is retrieved + and stored in the ``X-Service-Catalog`` header. This is required if you use + access-rules in Application Credentials. You may also need to increase + `max_header_size`. -* Those variables beginning with ``auth_`` point to the Keystone - Admin service. This information is used by the middleware to actually - query Keystone about the validity of the - authentication tokens. -* The admin auth credentials (``admin_user``, ``admin_tenant_name``, - ``admin_password``) will be used to retrieve an admin token. That - token will be used to authorize user tokens behind the scenes. .. note:: - If support is required for unvalidated users (as with anonymous - access) or for tempurl/formpost middleware, authtoken will need - to be configured with delay_auth_decision set to 1. + The authtoken config variable ``delay_auth_decision`` must be set to + ``True``. The default is ``False``, but that breaks public access, + :ref:`staticweb`, :ref:`formpost`, :ref:`tempurl`, and authenticated + capabilities requests (using :ref:`discoverability`). + +and you can finally add the keystoneauth configuration. Here is a simple +configuration:: + + [filter:keystoneauth] + use = egg:swift#keystoneauth + operator_roles = admin, swiftoperator -and you can finally add the keystoneauth configuration:: +Use an appropriate list of roles in operator_roles. For example, in +some systems, the role ``_member_`` or ``Member`` is used to indicate +that the user is allowed to operate on project resources. + +OpenStack Service Using Composite Tokens +---------------------------------------- + +Some OpenStack services such as Cinder and Glance may use +a "service account". In this mode, you configure a separate account where +the service stores project data that it manages. This account is not used +directly by the end-user. Instead, all access is done through the service. + +To access the "service" account, the service must present two tokens: one from +the end-user and another from its own service user. Only when both tokens are +present can the account be accessed. This section describes how to set the +configuration options to correctly control access to both the "normal" and +"service" accounts. 
+ +In this example, end users use the ``AUTH_`` prefix in account names, +whereas services use the ``SERVICE_`` prefix:: + + [filter:keystoneauth] + use = egg:swift#keystoneauth + reseller_prefix = AUTH, SERVICE + operator_roles = admin, swiftoperator + SERVICE_service_roles = service + +The actual values for these variable will need to be set depending on your +situation as follows: + +* The first item in the reseller_prefix list must match Keystone's endpoint + (see ``/etc/keystone/default_catalog.templates`` above). Normally + this is ``AUTH``. +* The second item in the reseller_prefix list is the prefix used by the + OpenStack services(s). You must configure this value (``SERVICE`` in the + example) with whatever the other OpenStack service(s) use. +* Set the operator_roles option to contain a role or roles that end-user's + have on project's they use. +* Set the SERVICE_service_roles value to a role or roles that only the + OpenStack service user has. Do not use a role that is assigned to + "normal" end users. In this example, the role ``service`` is used. + The service user is granted this role to a *single* project only. You do + not need to make the service user a member of every project. + +This configuration works as follows: + +* The end-user presents a user token to an OpenStack service. The service + then makes a Swift request to the account with the ``SERVICE`` prefix. +* The service forwards the original user token with the request. It also + adds it's own service token. +* Swift validates both tokens. When validated, the user token gives the + ``admin`` or ``swiftoperator`` role(s). When validated, the service token + gives the ``service`` role. +* Swift interprets the above configuration as follows: + + * Did the user token provide one of the roles listed in operator_roles? + * Did the service token have the ``service`` role as described by the + ``SERVICE_service_roles`` options. + +* If both conditions are met, the request is granted. Otherwise, Swift + rejects the request. + +In the above example, all services share the same account. You can separate +each service into its own account. For example, the following provides a +dedicated account for each of the Glance and Cinder services. In addition, +you must assign the ``glance_service`` and ``cinder_service`` to the +appropriate service users:: [filter:keystoneauth] use = egg:swift#keystoneauth + reseller_prefix = AUTH, IMAGE, VOLUME operator_roles = admin, swiftoperator + IMAGE_service_roles = glance_service + VOLUME_service_roles = cinder_service + + +Access control using keystoneauth +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +By default the only users able to perform operations (e.g. create a container) +on an account are those having a Keystone role for the corresponding Keystone +project that matches one of the roles specified in the ``operator_roles`` +option. + +Users who have one of the ``operator_roles`` will be able to set container ACLs +to grant other users permission to read and/or write objects in specific +containers, using ``X-Container-Read`` and ``X-Container-Write`` headers +respectively. In addition to the ACL formats described +:mod:`here `, keystoneauth supports ACLs using the +format:: + + other_project_id:other_user_id. + +where ``other_project_id`` is the UUID of a Keystone project and +``other_user_id`` is the UUID of a Keystone user. This will allow the other +user to access a container provided their token is scoped on the other +project. 
Both ``other_project_id`` and ``other_user_id`` may be replaced with +the wildcard character ``*`` which will match any project or user respectively. + +Be sure to use Keystone UUIDs rather than names in container ACLs. + +.. note:: + + For backwards compatibility, keystoneauth will by default grant container + ACLs expressed as ``other_project_name:other_user_name`` (i.e. using + Keystone names rather than UUIDs) in the special case when both the other + project and the other user are in Keystone's default domain and the project + being accessed is also in the default domain. + + For further information see :ref:`keystoneauth` + +Users with the Keystone role defined in ``reseller_admin_role`` +(``ResellerAdmin`` by default) can operate on any account. The auth system +sets the request environ reseller_request to True if a request is coming +from a user with this role. This can be used by other middlewares. + +Troubleshooting tips for keystoneauth deployment +~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -By default the only users able to give ACL or to Create other -containers are the ones who has the Keystone role specified in the -``operator_roles`` setting. +Some common mistakes can result in API requests failing when first deploying +keystone with Swift: -This user who have one of those role will be able to give ACLs to -other users on containers, see the documentation on ACL here -:mod:`swift.common.middleware.acl`. +* Incorrect configuration of the Swift endpoint in the Keystone service. + + By default, keystoneauth expects the account part of a URL to have the form + ``AUTH_``. Sometimes the ``AUTH_`` prefix is missed when + configuring Swift endpoints in Keystone, as described in the `Install Guide + `_. This is easily diagnosed by inspecting the + proxy-server log file for a failed request URL and checking that the URL + includes the ``AUTH_`` prefix (or whatever reseller prefix may have been + configured for keystoneauth):: + + GOOD: + proxy-server: 127.0.0.1 127.0.0.1 07/Sep/2016/16/06/58 HEAD /v1/AUTH_cfb8d9d45212408b90bc0776117aec9e HTTP/1.0 204 ... + + BAD: + proxy-server: 127.0.0.1 127.0.0.1 07/Sep/2016/16/07/35 HEAD /v1/cfb8d9d45212408b90bc0776117aec9e HTTP/1.0 403 ... + + +* Incorrect configuration of the ``authtoken`` middleware options in the Swift + proxy server. + + The ``authtoken`` middleware communicates with the Keystone service to + validate tokens that are presented with client requests. To do this + ``authtoken`` must authenticate itself with Keystone using the credentials + configured in the ``[filter:authtoken]`` section of + ``/etc/swift/proxy-server.conf``. Errors in these credentials can result in + ``authtoken`` failing to validate tokens and may be revealed in the proxy + server logs by a message such as:: + + proxy-server: Identity server rejected authorization + + .. note:: + + More detailed log messaging may be seen by setting the ``authtoken`` + option ``log_level = debug``. + + The ``authtoken`` configuration options may be checked by attempting to use + them to communicate directly with Keystone using an ``openstack`` command + line. 
For example, given the ``authtoken`` configuration sample shown in + :ref:`configuring_keystone_auth`, the following command should return a + service catalog:: + + openstack --os-identity-api-version=3 --os-auth-url=http://keystonehost:5000/ \ + --os-username=swift --os-user-domain-id=default \ + --os-project-name=service --os-project-domain-id=default \ + --os-password=password catalog show object-store + + If this ``openstack`` command fails then it is likely that there is a problem + with the ``authtoken`` configuration. + +.. _extending_auth: -------------- Extending Auth @@ -135,7 +372,8 @@ Extending Auth TempAuth is written as wsgi middleware, so implementing your own auth is as easy as writing new wsgi middleware, and plugging it in to the proxy server. -The KeyStone project and the Swauth project are examples of additional auth -services. -Also, see :doc:`development_auth`. +See :doc:`development_auth` for detailed information on extending the +auth system. + + diff --git a/doc/source/overview_backing_store.rst b/doc/source/overview_backing_store.rst new file mode 100644 index 0000000000..0bb1251a4c --- /dev/null +++ b/doc/source/overview_backing_store.rst @@ -0,0 +1,273 @@ + +============================================= +Using Swift as Backing Store for Service Data +============================================= + +---------- +Background +---------- + +This section provides guidance to OpenStack Service developers for how to +store your users' data in Swift. An example of this is that a user requests +that Nova save a snapshot of a VM. Nova passes the request to Glance, +Glance writes the image to a Swift container as a set of objects. + +Throughout this section, the following terminology and concepts are used: + +* User or end-user. This is a person making a request that will result in + an OpenStack Service making a request to Swift. + +* Project (also known as Tenant). This is the unit of resource ownership. + While data such as snapshot images or block volume backups may be + stored as a result of an end-user's request, the reality is that these + are project data. + +* Service. This is a program or system used by end-users. Specifically, it + is any program or system that is capable of receiving end-user's tokens and + validating the token with the Keystone Service and has a need to store + data in Swift. Glance and Cinder are examples of such Services. + +* Service User. This is a Keystone user that has been assigned to a Service. + This allows the Service to generate and use its own tokens so that it + can interact with other Services as itself. + +* Service Project. This is a project (tenant) that is associated with a + Service. There may be a single project shared by many Services or there + may be a project dedicated to each Service. In this document, the + main purpose of the Service Project is to allow the system operator + to configure specific roles for each Service User. + +------------------------------- +Alternate Backing Store Schemes +------------------------------- + +There are three schemes described here: + +* Dedicated Service Account (Single Tenant) + + Your Service has a dedicated Service Project (hence a single dedicated + Swift account). Data for all users and projects are stored in this + account. Your Service must have a user assigned to it (the Service User). 
+ When you have data to store on behalf of one of your users, you use the + Service User credentials to get a token for the Service Project and + request Swift to store the data in the Service Project. + + With this scheme, data for all users is stored in a single account. This + is transparent to your users and since the credentials for the Service User + are typically not shared with anyone, your users' cannot access their + data by making a request directly to Swift. However, since data belonging + to all users is stored in one account, it presents a single point of + vulnerably to accidental deletion or a leak of the service-user + credentials. + +* Multi Project (Multi Tenant) + + Data belonging to a project is stored in the Swift account + associated with the project. Users make requests to your Service using + a token scoped to a project in the normal way. You can then use this + same token to store the user data in the project's Swift account. + + The effect is that data is stored in multiple projects (aka tenants). + Hence this scheme has been known as the "multi tenant" scheme. + + With this scheme, access is controlled by Keystone. The users must + have a role that allows them to perform the request to your Service. In + addition, they must have a role that also allows them to store data in + the Swift account. By default, the admin or swiftoperator roles are + used for this purpose (specific systems may use other role names). If the + user does not have the appropriate roles, when your Service attempts + to access Swift, the operation will fail. + + Since you are using the user's token to access the data, it follows that + the user can use the same token to access Swift directly -- bypassing your + Service. When end-users are browsing containers, they will also see + your Service's containers and objects -- and may potentially delete + the data. Conversely, there is no single account where all data so leakage + of credentials will only affect a single project/tenant. + +* Service Prefix Account + + Data belonging to a project is stored in a Swift account associated + with the project. This is similar to the Multi Project scheme described + above. However, the Swift account is different than the account that + users access. Specifically, it has a different account prefix. For example, + for the project 1234, the user account is named AUTH_1234. Your Service uses + a different account, for example, SERVICE_1234. + + To access the SERVICE_1234 account, you must present two tokens: the user's + token is put in the X-Auth-Token header. You present your Service's token + in the X-Service-Token header. Swift is configured such that only when both + tokens are presented will it allow access. Specifically, the user cannot + bypass your Service because they only have their own token. Conversely, your + Service can only access the data while it has a copy of the user's token -- + the Service's token by itself will not grant access. + + The data stored in the Service Prefix Account cannot be seen by end-users. + So they cannot delete this data -- they can only access the data if they + make a request through your Service. The data is also more secure. To make + an unauthorized access, someone would need to compromise both an end-user's + and your Service User credentials. Even then, this would only expose one + project -- not other projects. + +The Service Prefix Account scheme combines features of the Dedicated Service +Account and Multi Project schemes. 
+It has the private, dedicated,
+characteristics of the Dedicated Service Account scheme but does not present
+a single point of attack. Using the Service Prefix Account scheme is a little
+more involved than the other schemes, so the rest of this document describes
+it in more detail.
+
+-------------------------------
+Service Prefix Account Overview
+-------------------------------
+
+The following diagram shows the flow through the system from the end-user,
+to your Service and then onto Swift::
+
+      client
+         \
+          \   <request>: <request path>
+           \  x-auth-token: <user token>
+            \
+          SERVICE
+             \
+              \   PUT: /v1/SERVICE_1234/<container>/<object>
+               \  x-auth-token: <user token>
+                \ x-service-token: <service token>
+                 \
+                Swift
+
+The sequence of events and actions is as follows:
+
+* Request arrives at your Service
+
+* The <user token> is validated by the keystonemiddleware.auth_token
+  middleware. The user's role(s) are used to determine if the user
+  can perform the request. See :doc:`overview_auth` for technical
+  information on the authentication system.
+
+* As part of this request, your Service needs to access Swift (either to
+  write or read a container or object). In this example, you want to perform
+  a PUT on <container>/<object>.
+
+* In the wsgi environment, the auth_token module will have populated the
+  HTTP_X_SERVICE_CATALOG item. This lists the Swift endpoint and account.
+  This is something such as https://<netloc>/v1/AUTH_1234 where ``AUTH_``
+  is a prefix and ``1234`` is the project id.
+
+* The ``AUTH_`` prefix is the default value. However, your system may use a
+  different prefix. To determine the actual prefix, search for the first
+  underscore ('_') character in the account name. If there is no underscore
+  character in the account name, this means there is no prefix.
+
+* Your Service should have a configuration parameter that provides the
+  appropriate prefix to use for storing data in Swift. There is more
+  discussion of this below, but for now assume the prefix is ``SERVICE_``.
+
+* Replace the prefix (``AUTH_`` in above examples) in the path with
+  ``SERVICE_``, so the full URL to access the object becomes
+  https://<netloc>/v1/SERVICE_1234/<container>/<object>.
+
+* Make the request to Swift, using this URL. In the X-Auth-Token header place
+  a copy of the <user token>. In the X-Service-Token header, place your
+  Service's token. If you use python-swiftclient you can achieve this
+  by:
+
+  * Putting the URL in the ``preauthurl`` parameter
+  * Putting the <user token> in the ``preauthtoken`` parameter
+  * Adding the X-Service-Token to the ``headers`` parameter
+
+
+Using the HTTP_X_SERVICE_CATALOG to get Swift Account Name
+----------------------------------------------------------
+
+The auth_token middleware populates the wsgi environment with information when
+it validates the user's token. The HTTP_X_SERVICE_CATALOG item is a JSON
+string containing details of the OpenStack endpoints. For Swift, this also
+contains the project's Swift account name. Here is an example of a catalog
+entry for Swift::
+
+    "serviceCatalog": [
+        ...
+        {
+            ....
+            "type": "object-store",
+            "endpoints": [
+                ...
+                {
+                    ...
+                    "publicURL": "https://<netloc>/v1/AUTH_1234",
+                    "region": "<region name>"
+                    ...
+                }
+                ...
+            ...
+        }
+    }
+
+To get the End-user's account:
+
+* Look for an entry with ``type`` of ``object-store``
+
+* If there are several regions, there will be several endpoints. Use the
+  appropriate region name and select the ``publicURL`` item.
+
+* The Swift account name is the final item in the path ("AUTH_1234" in this
+  example).
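
A rough sketch of these steps using `python-swiftclient` is shown below. It is
illustrative only: the helper names are invented for this example, the
``SERVICE_`` prefix is assumed to match the ``reseller_prefix`` configured in
your cluster, and error handling is omitted::

    import json

    from swiftclient.client import Connection


    def service_account_url(environ, service_prefix='SERVICE_'):
        # HTTP_X_SERVICE_CATALOG is the JSON string placed in the WSGI
        # environment by the auth_token middleware.
        catalog = json.loads(environ['HTTP_X_SERVICE_CATALOG'])
        swift = next(e for e in catalog if e.get('type') == 'object-store')
        # Pick the endpoint for your region; this sketch takes the first one.
        public_url = swift['endpoints'][0]['publicURL']
        # e.g. https://<netloc>/v1/AUTH_1234 -> https://<netloc>/v1/SERVICE_1234
        base, account = public_url.rsplit('/', 1)
        project_id = account.split('_', 1)[1] if '_' in account else account
        return '%s/%s%s' % (base, service_prefix, project_id)


    def store_for_user(environ, user_token, service_token, container, obj, data):
        # preauthurl/preauthtoken make swiftclient use the URL and the user's
        # token as given; the Service token rides along in X-Service-Token.
        conn = Connection(preauthurl=service_account_url(environ),
                          preauthtoken=user_token, retries=3)
        service_headers = {'X-Service-Token': service_token}
        conn.put_container(container, headers=service_headers)
        conn.put_object(container, obj, contents=data, headers=service_headers)

Reads work the same way: present the same two tokens against the
``SERVICE_``-prefixed URL.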
+ +Getting a Service Token +----------------------- + +A Service Token is no different than any other token and is requested +from Keystone using user credentials and project in the usual way. The core +requirement is that your Service User has the appropriate role. In practice: + +* Your Service must have a user assigned to it (the Service User). + +* Your Service has a project assigned to it (the Service Project). + +* The Service User must have a role on the Service Project. This role is + distinct from any of the normal end-user roles. + +* The role used must the role configured in the /etc/swift/proxy-server.conf. + This is the ``_service_roles`` option. In this example, the role + is the ``service`` role:: + + [keystoneauth] + reseller_prefix = AUTH_, SERVICE_ + SERVICE_service_role = service + +The ``service`` role should only be granted to OpenStack Services. It should +not be granted to users. + +Single or multiple Service Prefixes? +------------------------------------ + +Most of the examples used in this document used a single prefix. The +prefix, ``SERVICE`` was used. By using a single prefix, an operator is +allowing all OpenStack Services to share the same account for data +associated with a given project. For test systems or deployments well protected +on private firewalled networks, this is appropriate. + +However, if one Service is compromised, that Service can access +data created by another Service. To prevent this, multiple Service Prefixes may +be used. This also requires that the operator configure multiple service +roles. For example, in a system that has Glance and Cinder, the following +Swift configuration could be used:: + + [keystoneauth] + reseller_prefix = AUTH_, IMAGE_, BLOCK_ + IMAGE_service_roles = image_service + BLOCK_service_roles = block_service + +The Service User for Glance would be granted the ``image_service`` role on its +Service Project and the Cinder Service user is granted the ``block_service`` +role on its project. In this scheme, if the Cinder Service was compromised, +it would not be able to access any Glance data. + +Container Naming +---------------- + +Since a single Service Prefix is possible, container names should be prefixed +with a unique string to prevent name clashes. We suggest you use the service +type field (as used in the service catalog). For example, The Glance Service +would use "image" as a prefix. diff --git a/doc/source/overview_container_sharding.rst b/doc/source/overview_container_sharding.rst new file mode 100644 index 0000000000..f834b5946e --- /dev/null +++ b/doc/source/overview_container_sharding.rst @@ -0,0 +1,694 @@ +.. _sharding_doc: + +================== +Container Sharding +================== + +Container sharding is an operator controlled feature that may be used to shard +very large container databases into a number of smaller shard containers + +.. note:: + + It is strongly recommended that operators gain experience of sharding + containers in a non-production cluster before using in production. + + The sharding process involves moving all sharding container database + records via the container replication engine; the time taken to complete + sharding is dependent upon the existing cluster load and the performance of + the container database being sharded. + + There is currently no documented process for reversing the sharding + process once sharding has been enabled. + + +---------- +Background +---------- +The metadata for each container in Swift is stored in an SQLite database. 
This +metadata includes: information about the container such as its name, +modification time and current object count; user metadata that may been written +to the container by clients; a record of every object in the container. The +container database object records are used to generate container listings in +response to container GET requests; each object record stores the object's +name, size, hash and content-type as well as associated timestamps. + +As the number of objects in a container increases then the number of object +records in the container database increases. Eventually the container database +performance starts to degrade and the time taken to update an object record +increases. This can result in object updates timing out, with a corresponding +increase in the backlog of pending :ref:`asynchronous updates +` on object servers. Container databases are typically +replicated on several nodes and any database performance degradation can also +result in longer :doc:`container replication ` times. + +The point at which container database performance starts to degrade depends +upon the choice of hardware in the container ring. Anecdotal evidence suggests +that containers with tens of millions of object records have noticeably +degraded performance. + +This performance degradation can be avoided by ensuring that clients use an +object naming scheme that disperses objects across a number of containers +thereby distributing load across a number of container databases. However, that +is not always desirable nor is it under the control of the cluster operator. + +Swift's container sharding feature provides the operator with a mechanism to +distribute the load on a single client-visible container across multiple, +hidden, shard containers, each of which stores a subset of the container's +object records. Clients are unaware of container sharding; clients continue to +use the same API to access a container that, if sharded, maps to a number of +shard containers within the Swift cluster. + +------------------------ +Deployment and operation +------------------------ + +Upgrade Considerations +---------------------- + +It is essential that all servers in a Swift cluster have been upgraded to +support the container sharding feature before attempting to shard a container. + +Identifying containers in need of sharding +------------------------------------------ + +Container sharding is currently initiated by the ``swift-manage-shard-ranges`` +CLI tool :ref:`described below `. Operators must +first identify containers that are candidates for sharding. To assist with +this, the :ref:`sharder_daemon` inspects the size of containers that it visits +and writes a list of sharding candidates to recon cache. For example:: + + "sharding_candidates": { + "found": 1, + "top": [ + { + "account": "AUTH_test", + "container": "c1", + "file_size": 497763328, + "meta_timestamp": "1525346445.31161", + "node_index": 2, + "object_count": 3349028, + "path": , + "root": "AUTH_test/c1" + } + ] + } + +A container is considered to be a sharding candidate if its object count is +greater than or equal to the ``shard_container_threshold`` option. +The number of candidates reported is limited to a number configured by the +``recon_candidates_limit`` option such that only the largest candidate +containers are included in the ``sharding_candidates`` data. + + +.. _swift-manage-shard-ranges: + +``swift-manage-shard-ranges`` CLI tool +-------------------------------------- + +.. 
automodule:: swift.cli.manage_shard_ranges + :members: + :show-inheritance: + + +.. _sharder_daemon: + +``container-sharder`` daemon +---------------------------- + +Once sharding has been enabled for a container, the act of sharding is +performed by the :ref:`container-sharder`. The :ref:`container-sharder` daemon +must be running on all container servers. The ``container-sharder`` daemon +periodically visits each container database to perform any container sharding +tasks that are required. + +The ``container-sharder`` daemon requires a ``[container-sharder]`` config +section to exist in the container server configuration file; a sample config +section is shown in the `container-server.conf-sample` file. + +.. note:: + + The ``auto_shard`` option is currently **NOT** recommended for production + systems and should be set to ``false`` (the default value). + + Several of the ``[container-sharder]`` config options are only significant + when the ``auto_shard`` option is enabled. This option enables the + ``container-sharder`` daemon to automatically identify containers that are + candidates for sharding and initiate the sharding process, instead of using + the ``swift-manage-shard-ranges`` tool. + +The container sharder uses an internal client and therefore requires an +internal client configuration file to exist. By default the internal-client +configuration file is expected to be found at +`/etc/swift/internal-client.conf`. An alternative location for the +configuration file may be specified using the ``internal_client_conf_path`` +option in the ``[container-sharder]`` config section. + +The content of the internal-client configuration file should be the same as the +`internal-client.conf-sample` file. In particular, the internal-client +configuration should have:: + + account_autocreate = True + +in the ``[proxy-server]`` section. + +A container database may require several visits by the ``container-sharder`` +daemon before it is fully sharded. On each visit the ``container-sharder`` +daemon will move a subset of object records to new shard containers by cleaving +new shard container databases from the original. By default, two shards are +processed per visit; this number may be configured by the ``cleave_batch_size`` +option. + +The ``container-sharder`` daemon periodically writes progress data for +containers that are being sharded to recon cache. For example:: + + "sharding_in_progress": { + "all": [ + { + "account": "AUTH_test", + "active": 0, + "cleaved": 2, + "container": "c1", + "created": 5, + "db_state": "sharding", + "error": null, + "file_size": 26624, + "found": 0, + "meta_timestamp": "1525349617.46235", + "node_index": 1, + "object_count": 3349030, + "path": , + "processing_time": 0.00381, + "root": "AUTH_test/c1", + "state": "sharding", + "tombstones": -1, + "total_replicate_time": 0.07549, + "total_sharding_time": 210.091, + } + ] + } + +This example indicates that from a total of 7 shard ranges, 2 have been cleaved +whereas 5 remain in created state waiting to be cleaved. + +Shard containers are created in an internal account and not visible to clients. +By default, shard containers for an account ``AUTH_test`` are created in the +internal account ``.shards_AUTH_test``. + +Once a container has started sharding, object updates to that container may be +redirected to the shard container. 
The ``container-sharder`` daemon is also +responsible for sending updates of a shard's object count and bytes_used to the +original container so that aggegrate object count and bytes used values can be +returned in responses to client requests. + +.. note:: + + The ``container-sharder`` daemon must continue to run on all container + servers in order for shards object stats updates to be generated. + + +-------------- +Under the hood +-------------- + +Terminology +----------- + +================== ==================================================== +Name Description +================== ==================================================== +Root container The original container that lives in the + user's account. It holds references to its + shard containers. +Retiring DB The original database file that is to be sharded. +Fresh DB A database file that will replace the retiring + database. +Epoch A timestamp at which the fresh DB is created; the + epoch value is embedded in the fresh DB filename. +Shard range A range of the object namespace defined by a lower + bound and upper bound. +Shard container A container that holds object records for a shard + range. Shard containers exist in a hidden account + mirroring the user's account. +Parent container The container from which a shard container has been + cleaved. When first sharding a root container each + shard's parent container will be the root container. + When sharding a shard container each shard's parent + container will be the sharding shard container. +Misplaced objects Items that don't belong in a container's shard + range. These will be moved to their correct + location by the container-sharder. +Cleaving The act of moving object records within a shard + range to a shard container database. +Shrinking The act of merging a small shard container into + another shard container in order to delete the + small shard container. +Donor The shard range that is shrinking away. +Acceptor The shard range into which a donor is merged. +================== ==================================================== + + +Finding shard ranges +-------------------- + +The end goal of sharding a container is to replace the original container +database which has grown very large with a number of shard container databases, +each of which is responsible for storing a range of the entire object +namespace. The first step towards achieving this is to identify an appropriate +set of contiguous object namespaces, known as shard ranges, each of which +contains a similar sized portion of the container's current object content. + +Shard ranges cannot simply be selected by sharding the namespace uniformly, +because object names are not guaranteed to be distributed uniformly. If the +container were naively sharded into two shard ranges, one containing all +object names up to `m` and the other containing all object names beyond `m`, +then if all object names actually start with `o` the outcome would be an +extremely unbalanced pair of shard containers. + +It is also too simplistic to assume that every container that requires sharding +can be sharded into two. This might be the goal in the ideal world, but in +practice there will be containers that have grown very large and should be +sharded into many shards. Furthermore, the time required to find the exact +mid-point of the existing object names in a large SQLite database would +increase with container size. 
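
Before describing the approach Swift takes, the following toy sketch (not the
sharder's actual code) makes the imbalance problem concrete and illustrates the
alternative described next: choosing bounds by object count rather than by
splitting the name space::

    # 1000 object names that all happen to start with 'o'.
    names = sorted('obj-%06d' % i for i in range(1000))

    # Naively splitting the namespace at 'm' puts everything in one shard.
    left = [n for n in names if n <= 'm']
    right = [n for n in names if n > 'm']
    print(len(left), len(right))    # 0 1000

    # Choosing bounds by row count gives balanced ranges whatever the names.
    N = 250
    bounds = [names[i - 1] for i in range(N, len(names), N)]
    print(bounds)                   # upper bounds of the first three ranges;
                                    # the final range is unbounded above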
+
+For these reasons, shard ranges of size `N` are found by searching for the
+`Nth` object in the database table, sorted by object name, and then searching
+for the `(2 * N)th` object, and so on until all objects have been searched. For
+a container that has exactly `2N` objects, the end result is the same as
+sharding the container at the midpoint of its object names. In practice
+sharding would typically be enabled for containers with greater than `2N`
+objects and more than two shard ranges will be found, the last one probably
+containing fewer than `N` objects. With containers having large multiples of
+`N` objects, shard ranges can be identified in batches, which enables a more
+scalable solution.
+
+To illustrate this process, consider a very large container in a user account
+``acct`` that is a candidate for sharding:
+
+.. image:: images/sharding_unsharded.svg
+
+The :ref:`swift-manage-shard-ranges` tool ``find`` sub-command searches the
+object table for the `Nth` object whose name will become the upper bound of the
+first shard range, and the lower bound of the second shard range. The lower
+bound of the first shard range is the empty string.
+
+For the purposes of this example the first upper bound is `cat`:
+
+.. image:: images/sharding_scan_basic.svg
+
+:ref:`swift-manage-shard-ranges` continues to search the container to find
+further shard ranges, with the final upper bound also being the empty string.
+
+Enabling sharding
+-----------------
+
+Once shard ranges have been found the :ref:`swift-manage-shard-ranges`
+``replace`` sub-command is used to insert them into the `shard_ranges` table
+of the container database. In addition to its lower and upper bounds, each
+shard range is given a unique name.
+
+The ``enable`` sub-command then creates some final state required to initiate
+sharding the container, including a special shard range record referred to as
+the container's `own_shard_range` whose name is equal to the container's path.
+This is used to keep a record of the object namespace that the container
+covers, which for user containers is always the entire namespace. Sharding of
+the container will only begin when its own shard range's state has been set to
+``SHARDING``.
+
+The :class:`~swift.common.utils.ShardRange` class
+--------------------------------------------------
+
+The :class:`~swift.common.utils.ShardRange` class provides methods for
+interacting with the attributes and state of a shard range. The class
+encapsulates the following properties:
+
+* The name of the shard range which is also the name of the shard container
+  used to hold object records in its namespace.
+* Lower and upper bounds which define the object namespace of the shard range.
+* A deleted flag.
+* A timestamp at which the bounds and deleted flag were last modified.
+* The object stats for the shard range i.e. object count and bytes used.
+* A timestamp at which the object stats were last modified.
+* The state of the shard range, and an epoch, which is the timestamp used in
+  the shard container's database file name.
+* A timestamp at which the state and epoch were last modified.
+
+A shard range progresses through the following states:
+
+* FOUND: the shard range has been identified in the container that is to be
+  sharded but no resources have been created for it.
+* CREATED: a shard container has been created to store the contents of the
+  shard range.
+* CLEAVED: the sharding container's contents for the shard range have been
+  copied to the shard container from *at least one replica* of the sharding
+  container.
+* ACTIVE: a sharding container's constituent shard ranges are moved to this
+  state when all shard ranges in the sharding container have been cleaved.
+* SHRINKING: the shard range has been enabled for shrinking; or
+* SHARDING: the shard range has been enabled for sharding into further
+  sub-shards.
+* SHARDED: the shard range has completed sharding or shrinking; the container
+  will typically now have a number of constituent ACTIVE shard ranges.
+
+.. note::
+
+   Shard range state represents the most advanced state of the shard range on
+   any replica of the container. For example, a shard range in CLEAVED state
+   may not have completed cleaving on all replicas but has cleaved on at least
+   one replica.
+
+Fresh and retiring database files
+---------------------------------
+
+As alluded to earlier, writing to a large container causes increased latency
+for the container servers. Once sharding has been initiated on a container it
+is desirable to stop writing to the large database; ultimately it will be
+unlinked. This is primarily achieved by redirecting object updates to new shard
+containers as they are created (see :ref:`redirecting_updates` below), but some
+object updates may still need to be accepted by the root container and other
+container metadata must still be modifiable.
+
+To render the large `retiring` database effectively read-only, when the
+:ref:`sharder_daemon` finds a container with a set of shard range records,
+including an `own_shard_range`, it first creates a fresh database file which
+will ultimately replace the existing `retiring` database. For a retiring DB
+whose filename is::
+
+    <hash>.db
+
+the fresh database file name is of the form::
+
+    <hash>_<epoch>.db
+
+where `epoch` is a timestamp stored in the container's `own_shard_range`.
+
+The fresh DB has a copy of the shard ranges table from the retiring DB and all
+other container metadata apart from the object records. Once a fresh DB file
+has been created it is used to store any new object updates and no more object
+records are written to the retiring DB file.
+
+Once the sharding process has completed, the retiring DB file will be unlinked
+leaving only the fresh DB file in the container's directory. There are
+therefore three states that the container DB directory may be in during the
+sharding process: UNSHARDED, SHARDING and SHARDED.
+
+.. image:: images/sharding_db_states.svg
+
+If the container ever shrinks to the point that it has no shards then the fresh
+DB starts to store object records, behaving the same as an unsharded container.
+This is known as the COLLAPSED state.
+
+In summary, the DB states that any container replica may be in are:
+
+- UNSHARDED - In this state there is just one standard container database. All
+  containers are originally in this state.
+- SHARDING - There are now two databases, the retiring database and a fresh
+  database. The fresh database stores any metadata, container level stats,
+  an object holding table, and a table that stores shard ranges.
+- SHARDED - There is only one database, the fresh database, which has one or
+  more shard ranges in addition to its own shard range. The retiring database
+  has been unlinked.
+- COLLAPSED - There is only one database, the fresh database, which has only
+  its own shard range and stores object records.
+
+..
note:: + + DB state is unique to each replica of a container and is not necessarily + synchronised with shard range state. + +Creating shard containers +------------------------- + +The :ref:`sharder_daemon` next creates a shard container for each shard range +using the shard range name as the name of the shard container: + +.. image:: /images/sharding_cleave_basic.svg + +Each shard container has an `own_shard_range` record which has the +lower and upper bounds of the object namespace for which it is responsible, and +a reference to the sharding user container, which is referred to as the +`root_container`. Unlike the `root_container`, the shard container's +`own_shard_range` does not cover the entire namepsace. + +A shard range name takes the form ``/`` where `` +is a hidden account and `` is a container name that is derived from +the root container. + +The account name `` used for shard containers is formed by prefixing +the user account with the string ``.shards_``. This avoids namespace collisions +and also keeps all the shard containers out of view from users of the account. + +The container name for each shard container has the form:: + + --- + +where `root container name` is the name of the user container to which the +contents of the shard container belong, `parent container` is the name of the +container from which the shard is being cleaved, `timestamp` is the time at +which the shard range was created and `shard index` is the position of the +shard range in the name-ordered list of shard ranges for the `parent +container`. + +When sharding a user container the parent container name will be the same as +the root container. However, if a *shard container* grows to a size that it +requires sharding, then the parent container name for its shards will be the +name of the sharding shard container. + +For example, consider a user container with path ``AUTH_user/c`` which is +sharded into two shard containers whose name will be:: + + .shards_AUTH_user/c--1234512345.12345-0 + .shards_AUTH_user/c--1234512345.12345-1 + +If the first shard container is subsequently sharded into a further two shard +containers then they will be named:: + + .shards_AUTH_user/c--1234567890.12345-0)>-1234567890.12345-0 + .shards_AUTH_user/c--1234567890.12345-0)>-1234567890.12345-1 + +This naming scheme guarantees that shards, and shards of shards, each have a +unique name of bounded length. + + +Cleaving shard containers +------------------------- + +Having created empty shard containers the sharder daemon will proceed to cleave +objects from the retiring database to each shard range. Cleaving occurs in +batches of two (by default) shard ranges, so if a container has more than two +shard ranges then the daemon must visit it multiple times to complete cleaving. + +To cleave a shard range the daemon creates a shard database for the shard +container on a local device. This device may be one of the shard container's +primary nodes but often it will not. Object records from the corresponding +shard range namespace are then copied from the retiring DB to this shard DB. + +Swift's container replication mechanism is then used to replicate the shard DB +to its primary nodes. Checks are made to ensure that the new shard container DB +has been replicated to a sufficient number of its primary nodes before it is +considered to have been successfully cleaved. 
By default the daemon requires +successful replication of a new shard broker to at least a quorum of the +container rings replica count, but this requirement can be tuned using the +``shard_replication_quorum`` option. + +Once a shard range has been successfully cleaved from a retiring database the +daemon transitions its state to ``CLEAVED``. It should be noted that this state +transition occurs as soon as any one of the retiring DB replicas has cleaved +the shard range, and therefore does not imply that all retiring DB replicas +have cleaved that range. The significance of the state transition is that the +shard container is now considered suitable for contributing to object listings, +since its contents are present on a quorum of its primary nodes and are the +same as at least one of the retiring DBs for that namespace. + +Once a shard range is in the ``CLEAVED`` state, the requirement for +'successful' cleaving of other instances of the retirng DB may optionally be +relaxed since it is not so imperative that their contents are replicated +*immediately* to their primary nodes. The ``existing_shard_replication_quorum`` +option can be used to reduce the quorum required for a cleaved shard range to +be considered successfully replicated by the sharder daemon. + +.. note:: + + Once cleaved, shard container DBs will continue to be replicated by the + normal `container-replicator` daemon so that they will eventually be fully + replicated to all primary nodes regardless of any replication quorum options + used by the sharder daemon. + +The cleaving progress of each replica of a retiring DB must be +tracked independently of the shard range state. This is done using a per-DB +CleavingContext object that maintains a cleaving cursor for the retiring DB +that it is associated with. The cleaving cursor is simply the upper bound of +the last shard range to have been cleaved *from that particular retiring DB*. + +Each CleavingContext is stored in the sharding container's sysmeta under a key +that is the ``id`` of the retiring DB. Since all container DB files have a +unique ``id``, this guarantees that each retiring DB will have a unique +CleavingContext. Furthermore, if the retiring DB file is changed, for example +by an rsync_then_merge replication operation which might change the contents of +the DB's object table, then it will get a new unique CleavingContext. + +A CleavingContext maintains other state that is used to ensure that a retiring +DB is only considered to be fully cleaved, and ready to be deleted, if *all* of +its object rows have been cleaved to a shard range. + +Once all shard ranges have been cleaved from the retiring DB it is deleted. The +container is now represented by the fresh DB which has a table of shard range +records that point to the shard containers that store the container's object +records. + +.. _redirecting_updates: + +Redirecting object updates +-------------------------- + +Once a shard container exists, object updates arising from new client requests +and async pending files are directed to the shard container instead of the root +container. This takes load off of the root container. + +For a sharded (or partially sharded) container, when the proxy receives a new +object request it issues a GET request to the container for data describing a +shard container to which the object update should be sent. The proxy then +annotates the object request with the shard container location so that the +object server will forward object updates to the shard container. 
If those +updates fail then the async pending file that is written on the object server +contains the shard container location. + +When the object updater processes async pending files for previously failed +object updates, it may not find a shard container location. In this case the +updater sends the update to the `root container`, which returns a redirection +response with the shard container location. + +.. note:: + + Object updates are directed to shard containers as soon as they exist, even + if the retiring DB object records have not yet been cleaved to the shard + container. This prevents further writes to the retiring DB and also avoids + the fresh DB being polluted by new object updates. The goal is to + ultimately have all object records in the shard containers and none in the + root container. + +Building container listings +--------------------------- + +Listing requests for a sharded container are handled by querying the shard +containers for components of the listing. The proxy forwards the client listing +request to the root container, as it would for an unsharded container, but the +container server responds with a list of shard ranges rather than objects. The +proxy then queries each shard container in namespace order for their listing, +until either the listing length limit is reached or all shard ranges have been +listed. + +While a container is still in the process of sharding, only *cleaved* shard +ranges are used when building a container listing. Shard ranges that have not +yet cleaved will not have any object records from the root container. The root +container continues to provide listings for the uncleaved part of its +namespace. + +.. note:: + + New object updates are redirected to shard containers that have not yet been + cleaved. These updates will not therefore be included in container listings + until their shard range has been cleaved. + +Example request redirection +--------------------------- + +As an example, consider a sharding container in which 3 shard ranges have been +found ending in cat, giraffe and igloo. Their respective shard containers have +been created so update requests for objects up to "igloo" are redirected to the +appropriate shard container. The root DB continues to handle listing requests +and update requests for any object name beyond "igloo". + +.. image:: images/sharding_scan_load.svg + +The sharder daemon cleaves objects from the retiring DB to the shard range DBs; +it also moves any misplaced objects from the root container's fresh DB to the +shard DB. Cleaving progress is represented by the blue line. Once the first +shard range has been cleaved listing requests for that namespace are directed +to the shard container. The root container still provides listings for the +remainder of the namespace. + +.. image:: images/sharding_cleave1_load.svg + +The process continues: the sharder cleaves the next range and a new range is +found with upper bound of "linux". Now the root container only needs to handle +listing requests up to "giraffe" and update requests for objects whose name is +greater than "linux". Load will continue to diminish on the root DB and be +dispersed across the shard DBs. + +.. image:: images/sharding_cleave2_load.svg + + +Container replication +--------------------- + +Shard range records are replicated between container DB replicas in much the +same way as object records are for unsharded containers. 
However, the usual +replication of object records between replicas of a container is halted as soon +as a container is capable of being sharded. Instead, object records are moved +to their new locations in shard containers. This avoids unnecessary replication +traffic between container replicas. + +To facilitate this, shard ranges are both 'pushed' and 'pulled' during +replication, prior to any attempt to replicate objects. This means that the +node initiating replication learns about shard ranges from the destination node +early during the replication process and is able to skip object replication if +it discovers that it has shard ranges and is able to shard. + +.. note:: + + When the destination DB for container replication is missing then the + 'complete_rsync' replication mechanism is still used and in this case only + both object records and shard range records are copied to the destination + node. + +Container deletion +------------------ + +Sharded containers may be deleted by a ``DELETE`` request just like an +unsharded container. A sharded container must be empty before it can be deleted +which implies that all of its shard containers must have reported that they are +empty. + +Shard containers are *not* immediately deleted when their root container is +deleted; the shard containers remain undeleted so that they are able to +continue to receive object updates that might arrive after the root container +has been deleted. Shard containers continue to update their deleted root +container with their object stats. If a shard container does receive object +updates that cause it to no longer be empty then the root container will no +longer be considered deleted once that shard container sends an object stats +update. + + +Sharding a shard container +-------------------------- + +A shard container may grow to a size that requires it to be sharded. +``swift-manage-shard-ranges`` may be used to identify shard ranges within a +shard container and enable sharding in the same way as for a root container. +When a shard is sharding it notifies the root container of its shard ranges so +that the root container can start to redirect object updates to the new +'sub-shards'. When the shard has completed sharding the root is aware of all +the new sub-shards and the sharding shard deletes its shard range record in the +root container shard ranges table. At this point the root container is aware of +all the new sub-shards which collectively cover the namespace of the +now-deleted shard. + +There is no hierarchy of shards beyond the root container and its immediate +shards. When a shard shards, its sub-shards are effectively re-parented with +the root container. + + +Shrinking a shard container +--------------------------- + +A shard container's contents may reduce to a point where the shard container is +no longer required. If this happens then the shard container may be shrunk into +another shard range. Shrinking is achieved in a similar way to sharding: an +'acceptor' shard range is written to the shrinking shard container's shard +ranges table; unlike sharding, where shard ranges each cover a subset of the +sharding container's namespace, the acceptor shard range is a superset of the +shrinking shard range. + +Once given an acceptor shard range the shrinking shard will cleave itself to +its acceptor, and then delete itself from the root container shard ranges +table. 
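
To close this overview, the toy sketch below shows how a name-ordered list of
shard ranges maps an object name to a shard container. This is an illustration
only; in a real cluster the logic lives in ``swift.common.utils.ShardRange``
and the proxy and container servers, and the bound semantics shown (exclusive
lower, inclusive upper) are an assumption of the sketch::

    from collections import namedtuple

    # '' as an upper bound means "to the end of the namespace".
    Range = namedtuple('Range', 'container lower upper')

    shard_ranges = [
        Range('.shards_AUTH_test/c-0', '', 'cat'),
        Range('.shards_AUTH_test/c-1', 'cat', 'giraffe'),
        Range('.shards_AUTH_test/c-2', 'giraffe', ''),
    ]

    def find_shard(object_name):
        for sr in shard_ranges:
            if object_name > sr.lower and (not sr.upper or object_name <= sr.upper):
                return sr.container

    print(find_shard('aardvark'))   # .shards_AUTH_test/c-0
    print(find_shard('zebra'))      # .shards_AUTH_test/c-2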
diff --git a/doc/source/overview_container_sync.rst b/doc/source/overview_container_sync.rst index b62136d258..7413911e87 100644 --- a/doc/source/overview_container_sync.rst +++ b/doc/source/overview_container_sync.rst @@ -14,25 +14,120 @@ synchronization key. .. note:: - Container sync will sync object POSTs only if the proxy server is set to - use "object_post_as_copy = true" which is the default. So-called fast - object posts, "object_post_as_copy = false" do not update the container - listings and therefore can't be detected for synchronization. + If you are using the :ref:`Large Objects ` feature and + syncing to another cluster then you will need to ensure that manifest files + and segment files are synced. If segment files are in a different container + than their manifest then both the manifest's container and the segments' + container must be synced. The target container for synced segment files + must always have the same name as their source container in order for them + to be resolved by synced manifests. + + Be aware that manifest files may be synced before segment files even if + they are in the same container and were created after the segment files. + + In the case of :ref:`Static Large Objects `, a GET + request for a manifest whose segments have yet to be completely synced will + fail with none or only part of the large object content being returned. + + In the case of :ref:`Dynamic Large Objects `, a GET + request for a manifest whose segments have yet to be completely synced will + either fail or return unexpected (and most likely incorrect) content. .. note:: - If you are using the large objects feature you will need to ensure both - your manifest file and your segment files are synced if they happen to be - in different containers. + If you are using encryption middleware in the cluster from which objects + are being synced, then you should follow the instructions for + :ref:`container_sync_client_config` to be compatible with encryption. --------------------------------------------- -Configuring a Cluster's Allowable Sync Hosts --------------------------------------------- +.. note:: -The Swift cluster operator must allow synchronization with a set of hosts -before the user can enable container synchronization. First, the backend -container server needs to be given this list of hosts in the -container-server.conf file:: + If you are using symlink middleware in the cluster from which objects + are being synced, then you should follow the instructions for + :ref:`symlink_container_sync_client_config` to be compatible with symlinks. + + Be aware that symlinks may be synced before their targets even if they are + in the same container and were created after the target objects. In such + cases, a GET for the symlink will fail with a ``404 Not Found`` error. If + the target has been overwritten, a GET may produce an older version (for + dynamic links) or a ``409 Conflict`` error (for static links). + +-------------------------- +Configuring Container Sync +-------------------------- + +Create a ``container-sync-realms.conf`` file specifying the allowable clusters +and their information:: + + [realm1] + key = realm1key + key2 = realm1key2 + cluster_clustername1 = https://host1/v1/ + cluster_clustername2 = https://host2/v1/ + + [realm2] + key = realm2key + key2 = realm2key2 + cluster_clustername3 = https://host3/v1/ + cluster_clustername4 = https://host4/v1/ + + +Each section name is the name of a sync realm. 
A sync realm is a set of +clusters that have agreed to allow container syncing with each other. Realm +names will be considered case insensitive. + +``key`` is the overall cluster-to-cluster key used in combination with the +external users' key that they set on their containers' +``X-Container-Sync-Key`` metadata header values. These keys will be used to +sign each request the container sync daemon makes and used to validate each +incoming container sync request. + +``key2`` is optional and is an additional key incoming requests will be checked +against. This is so you can rotate keys if you wish; you move the existing ``key`` +to ``key2`` and make a new ``key`` value. + +Any values in the realm section whose names begin with ``cluster_`` will +indicate the name and endpoint of a cluster and will be used by external users in +their containers' ``X-Container-Sync-To`` metadata header values with the format +``//realm_name/cluster_name/account_name/container_name``. Realm and cluster +names are considered case insensitive. + +The endpoint is what the container sync daemon will use when sending out +requests to that cluster. Keep in mind this endpoint must be reachable by all +container servers, since that is where the container sync daemon runs. Note +that the endpoint ends with ``/v1/`` and that the container sync daemon will then +add the ``account/container/obj`` name after that. + +Distribute this ``container-sync-realms.conf`` file to all your proxy servers +and container servers. + +You also need to add the container_sync middleware to your proxy pipeline. It +needs to be after any memcache middleware and before any auth middleware. The +``[filter:container_sync]`` section only needs the ``use`` item. For example:: + + [pipeline:main] + pipeline = healthcheck proxy-logging cache container_sync tempauth proxy-logging proxy-server + + [filter:container_sync] + use = egg:swift#container_sync + +The container sync daemon will use an internal client to sync objects. Even if +you don't configure the internal client, the container sync daemon will work +with default configuration. The default configuration is the same as +``internal-client.conf-sample``. If you want to configure the internal client, +please update ``internal_client_conf_path`` in ``container-server.conf``. The +configuration file at the path will be used for the internal client. + +------------------------------------------------------- +Old-Style: Configuring a Cluster's Allowable Sync Hosts +------------------------------------------------------- + +This section is for the old-style of using container sync. See the previous +section, Configuring Container Sync, for the new-style. + +With the old-style, the Swift cluster operator must allow synchronization with +a set of hosts before the user can enable container synchronization. First, the +backend container server needs to be given this list of hosts in the +``container-server.conf`` file:: [DEFAULT] # This is a comma separated list of hosts allowed in the @@ -52,13 +147,79 @@ container-server.conf file:: # Maximum amount of time to spend syncing each container # container_time = 60 -Tracking sync progress, problems, and just general activity can only be -achieved with log processing for this first release of container -synchronization. In that light, you may wish to set the above `log_` options to -direct the container-sync logs to a different file for easier monitoring. 
-Additionally, it should be noted there is no way for an end user to detect sync -progress or problems other than HEADing both containers and comparing the -overall information. + +---------------------- +Logging Container Sync +---------------------- + +Currently, log processing is the only way to track sync progress, problems, +and even just general activity for container synchronization. In that +light, you may wish to set the above ``log_`` options to direct the +container-sync logs to a different file for easier monitoring. Additionally, it +should be noted there is no way for an end user to monitor sync progress or +detect problems other than HEADing both containers and comparing the overall +information. + + + +----------------------------- +Container Sync Statistics +----------------------------- + +Container Sync INFO level logs contain activity metrics and accounting +information for insightful tracking. +Currently two different statistics are collected: + +About once an hour or so, accumulated statistics of all operations performed +by Container Sync are reported to the log file with the following format:: + + Since (time): (sync) synced [(delete) deletes, (put) puts], (skip) skipped, (fail) failed + +time + last report time +sync + number of containers with sync turned on that were successfully synced +delete + number of successful DELETE object requests to the target cluster +put + number of successful PUT object request to the target cluster +skip + number of containers whose sync has been turned off, but are not + yet cleared from the sync store +fail + number of containers with failure (due to exception, timeout or other + reason) + +For each container synced, per container statistics are reported with the +following format:: + + Container sync report: (container), time window start: (start), time window end: %(end), puts: (puts), posts: (posts), deletes: (deletes), bytes: (bytes), sync_point1: (point1), sync_point2: (point2), total_rows: (total) + +container + account/container statistics are for +start + report start time +end + report end time +puts + number of successful PUT object requests to the target container +posts + N/A (0) +deletes + number of successful DELETE object requests to the target container +bytes + number of bytes sent over the network to the target container +point1 + progress indication - the container's ``x_container_sync_point1`` +point2 + progress indication - the container's ``x_container_sync_point2`` +total + number of objects processed at the container + +It is possible that more than one server syncs a container, therefore log files +from all servers need to be evaluated + + ---------------------------------------------------------- Using the ``swift`` tool to set up synchronized containers @@ -73,6 +234,122 @@ Using the ``swift`` tool to set up synchronized containers You must be the account admin on the account to set synchronization targets and keys. +You simply tell each container where to sync to and give it a secret +synchronization key. 
First, let's get the account details for our two cluster +accounts:: + + $ swift -A http://cluster1/auth/v1.0 -U test:tester -K testing stat -v + StorageURL: http://cluster1/v1/AUTH_208d1854-e475-4500-b315-81de645d060e + Auth Token: AUTH_tkd5359e46ff9e419fa193dbd367f3cd19 + Account: AUTH_208d1854-e475-4500-b315-81de645d060e + Containers: 0 + Objects: 0 + Bytes: 0 + + $ swift -A http://cluster2/auth/v1.0 -U test2:tester2 -K testing2 stat -v + StorageURL: http://cluster2/v1/AUTH_33cdcad8-09fb-4940-90da-0f00cbf21c7c + Auth Token: AUTH_tk816a1aaf403c49adb92ecfca2f88e430 + Account: AUTH_33cdcad8-09fb-4940-90da-0f00cbf21c7c + Containers: 0 + Objects: 0 + Bytes: 0 + +Now, let's make our first container and tell it to synchronize to a second +we'll make next:: + + $ swift -A http://cluster1/auth/v1.0 -U test:tester -K testing post \ + -t '//realm_name/clustername2/AUTH_33cdcad8-09fb-4940-90da-0f00cbf21c7c/container2' \ + -k 'secret' container1 + +The ``-t`` indicates the cluster to sync to, which is the realm name of the +section from ``container-sync-realms.conf``, followed by the cluster name from +that section (without the ``cluster_`` prefix), followed by the account and container +names we want to sync to. The ``-k`` specifies the secret key the two containers will share for +synchronization; this is the user key, the cluster key in +``container-sync-realms.conf`` will also be used behind the scenes. + +Now, we'll do something similar for the second cluster's container:: + + $ swift -A http://cluster2/auth/v1.0 -U test2:tester2 -K testing2 post \ + -t '//realm_name/clustername1/AUTH_208d1854-e475-4500-b315-81de645d060e/container1' \ + -k 'secret' container2 + +That's it. Now we can upload a bunch of stuff to the first container and watch +as it gets synchronized over to the second:: + + $ swift -A http://cluster1/auth/v1.0 -U test:tester -K testing \ + upload container1 . + photo002.png + photo004.png + photo001.png + photo003.png + + $ swift -A http://cluster2/auth/v1.0 -U test2:tester2 -K testing2 \ + list container2 + + [Nothing there yet, so we wait a bit...] + +.. note:: + + If you're an operator running :ref:`saio` and just testing, each time you + configure a container for synchronization and place objects in the + source container you will need to ensure that container-sync runs + before attempting to retrieve objects from the target container. + That is, you need to run:: + + swift-init container-sync once + +Now expect to see objects copied from the first container to the second:: + + $ swift -A http://cluster2/auth/v1.0 -U test2:tester2 -K testing2 \ + list container2 + photo001.png + photo002.png + photo003.png + photo004.png + +You can also set up a chain of synced containers if you want more than two. +You'd point 1 -> 2, then 2 -> 3, and finally 3 -> 1 for three containers. +They'd all need to share the same secret synchronization key. + +.. _`python-swiftclient`: http://github.com/openstack/python-swiftclient + +----------------------------------- +Using curl (or other tools) instead +----------------------------------- + +So what's ``swift`` doing behind the scenes? Nothing overly complicated. It +translates the ``-t `` option into an ``X-Container-Sync-To: `` +header and the ``-k `` option into an ``X-Container-Sync-Key: `` +header. 
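
The same headers can also be set from Python with `python-swiftclient` rather
than the ``swift`` CLI; here is a sketch using the example accounts above (the
equivalent curl command follows)::

    from swiftclient.client import Connection

    conn = Connection(authurl='http://cluster1/auth/v1.0',
                      user='test:tester', key='testing')
    conn.post_container('container1', headers={
        'X-Container-Sync-To': '//realm_name/clustername2/'
                               'AUTH_33cdcad8-09fb-4940-90da-0f00cbf21c7c/container2',
        'X-Container-Sync-Key': 'secret',
    })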
+ +For instance, when we created the first container above and told it to +synchronize to the second, we could have used this curl command:: + + $ curl -i -X POST -H 'X-Auth-Token: AUTH_tkd5359e46ff9e419fa193dbd367f3cd19' \ + -H 'X-Container-Sync-To: //realm_name/clustername2/AUTH_33cdcad8-09fb-4940-90da-0f00cbf21c7c/container2' \ + -H 'X-Container-Sync-Key: secret' \ + 'http://cluster1/v1/AUTH_208d1854-e475-4500-b315-81de645d060e/container1' + HTTP/1.1 204 No Content + Content-Length: 0 + Content-Type: text/plain; charset=UTF-8 + Date: Thu, 24 Feb 2011 22:39:14 GMT + +--------------------------------------------------------------------- +Old-Style: Using the ``swift`` tool to set up synchronized containers +--------------------------------------------------------------------- + +.. note:: + + The ``swift`` tool is available from the `python-swiftclient`_ library. + +.. note:: + + You must be the account admin on the account to set synchronization targets + and keys. + +This is for the old-style of container syncing using ``allowed_sync_hosts``. + You simply tell each container where to sync to and give it a secret synchronization key. First, let's get the account details for our two cluster accounts:: @@ -139,9 +416,11 @@ They'd all need to share the same secret synchronization key. .. _`python-swiftclient`: http://github.com/openstack/python-swiftclient ------------------------------------ -Using curl (or other tools) instead ------------------------------------ +---------------------------------------------- +Old-Style: Using curl (or other tools) instead +---------------------------------------------- + +This is for the old-style of container syncing using ``allowed_sync_hosts``. So what's ``swift`` doing behind the scenes? Nothing overly complicated. It translates the ``-t `` option into an ``X-Container-Sync-To: `` @@ -164,27 +443,41 @@ synchronize to the second, we could have used this curl command:: What's going on behind the scenes, in the cluster? -------------------------------------------------- -The swift-container-sync does the job of sending updates to the remote -container. - -This is done by scanning the local devices for container databases and -checking for x-container-sync-to and x-container-sync-key metadata values. -If they exist, newer rows since the last sync will trigger PUTs or DELETEs -to the other container. - -.. note:: - - The swift-container-sync process runs on each container server in - the cluster and talks to the proxy servers in the remote cluster. - Therefore, the container servers must be permitted to initiate - outbound connections to the remote proxy servers. +Container ring devices have a directory called ``containers``, where container +databases reside. In addition to ``containers``, each container ring device +also has a directory called ``sync-containers``. ``sync-containers`` holds +symlinks to container databases that were configured for container sync using +``x-container-sync-to`` and ``x-container-sync-key`` metadata keys. + +The swift-container-sync process does the job of sending updates to the remote +container. This is done by scanning ``sync-containers`` for container +databases. For each container db found, newer rows since the last sync will +trigger PUTs or DELETEs to the other container. 
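
A highly simplified sketch of that per-database pass is shown below. It is
illustrative only; the real logic, including the sync-point bookkeeping
described further down, lives in the ``swift-container-sync`` daemon::

    # For each container DB found via sync-containers, walk the rows that are
    # newer than the last recorded sync point and mirror them to the remote
    # container; send_put/send_delete stand in for the actual HTTP requests.
    def sync_rows(rows, last_sync_point, send_put, send_delete):
        for row in rows:
            if row['ROWID'] <= last_sync_point:
                continue                      # already handled on a prior pass
            if row['deleted']:
                send_delete(row['name'])      # object removed locally
            else:
                send_put(row['name'])         # object created or updated
        return rows[-1]['ROWID'] if rows else last_sync_point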
+ +``sync-containers`` is maintained as follows: +Whenever the container-server processes a PUT or a POST request that carries +``x-container-sync-to`` and ``x-container-sync-key`` metadata keys the server +creates a symlink to the container database in ``sync-containers``. Whenever +the container server deletes a synced container, the appropriate symlink +is deleted from ``sync-containers``. + +In addition to the container-server, the container-replicator process does the +job of identifying containers that should be synchronized. This is done by +scanning the local devices for container databases and checking for +``x-container-sync-to`` and ``x-container-sync-key`` metadata values. If they exist +then a symlink to the container database is created in a ``sync-containers`` +sub-directory on the same device. + +Similarly, when the container sync metadata keys are deleted, the container +server and container-replicator would take care of deleting the symlinks +from ``sync-containers``. .. note:: - Container sync will sync object POSTs only if the proxy server is set to - use "object_post_as_copy = true" which is the default. So-called fast - object posts, "object_post_as_copy = false" do not update the container - listings and therefore can't be detected for synchronization. + The swift-container-sync process runs on each container server in the + cluster and talks to the proxy servers (or load balancers) in the remote + cluster. Therefore, the container servers must be permitted to initiate + outbound connections to the remote proxy servers (or load balancers). The actual syncing is slightly more complicated to make use of the three (or number-of-replicas) main nodes for a container without each trying to @@ -195,7 +488,7 @@ Two sync points are kept in each container database. When syncing a container, the container-sync process figures out which replica of the container it has. In a standard 3-replica scenario, the process will have either replica number 0, 1, or 2. This is used to figure out -which rows are belong to this sync process and which ones don't. +which rows belong to this sync process and which ones don't. An example may help. Assume a replica count of 3 and database row IDs are 1..6. Also, assume that container-sync is running on this @@ -223,7 +516,7 @@ hash of the object name, so it's not always guaranteed to be exactly one out of every three rows, but it usually gets close. For the sake of example, let's say that this process ends up owning rows 2 and 5. -Once it's finished syncing those rows, it updates SP1 to be the +Once it's finished trying to sync those rows, it updates SP1 to be the biggest row-id that it's seen, which is 6 in this example. :: SP2 SP1 @@ -241,19 +534,23 @@ container, creating new rows in the database. :: On the next run, the container-sync starts off looking at rows with ids between SP1 and SP2. This time, there are a bunch of them. The -sync process takes the ones it *does not* own and syncs them. Again, -this is based on the hashes, so this will be everything it didn't sync -before. In this example, that's rows 0, 1, 3, 4, and 6. - -Under normal circumstances, the container-sync processes for the other -replicas will have already taken care of synchronizing those rows, so -this is a set of quick checks. However, if one of those other sync +sync process try to sync all of them. If it succeeds, it will set +SP2 to equal SP1. 
If it fails, it will set SP2 to the failed object +and will continue to try all other objects till SP1, setting SP2 to +the first object that failed. + +Under normal circumstances, the container-sync processes +will have already taken care of synchronizing all rows, between SP1 +and SP2, resulting in a set of quick checks. +However, if one of the sync processes failed for some reason, then this is a vital fallback to make sure all the objects in the container get synchronized. Without this seemingly-redundant work, any container-sync failure results in -unsynchronized objects. +unsynchronized objects. Note that the container sync will persistently +retry to sync any faulty object until success, while logging each failure. -Once it's done with the fallback rows, SP2 is advanced to SP1. :: +Once it's done with the fallback rows, and assuming no faults occurred, +SP2 is advanced to SP1. :: SP2 SP1 diff --git a/doc/source/overview_encryption.rst b/doc/source/overview_encryption.rst new file mode 100644 index 0000000000..beab7ba11d --- /dev/null +++ b/doc/source/overview_encryption.rst @@ -0,0 +1,812 @@ +================= +Object Encryption +================= + +Swift supports the optional encryption of object data at rest on storage nodes. +The encryption of object data is intended to mitigate the risk of users' data +being read if an unauthorised party were to gain physical access to a disk. + +.. note:: + + Swift's data-at-rest encryption accepts plaintext object data from the + client, encrypts it in the cluster, and stores the encrypted data. This + protects object data from inadvertently being exposed if a data drive + leaves the Swift cluster. If a user wishes to ensure that the plaintext + data is always encrypted while in transit and in storage, it is strongly + recommended that the data be encrypted before sending it to the Swift + cluster. Encrypting on the client side is the only way to ensure that the + data is fully encrypted for its entire lifecycle. + +Encryption of data at rest is implemented by middleware that may be included in +the proxy server WSGI pipeline. The feature is internal to a Swift cluster and +not exposed through the API. Clients are unaware that data is encrypted by this +feature internally to the Swift service; internally encrypted data should never +be returned to clients via the Swift API. + +The following data are encrypted while at rest in Swift: + +* Object content i.e. the content of an object PUT request's body +* The entity tag (ETag) of objects that have non-zero content +* All custom user object metadata values i.e. metadata sent using + X-Object-Meta- prefixed headers with PUT or POST requests + +Any data or metadata not included in the list above are not encrypted, +including: + +* Account, container and object names +* Account and container custom user metadata values +* All custom user metadata names +* Object Content-Type values +* Object size +* System metadata + +.. note:: + + This feature is intended to provide `confidentiality` of data that is at + rest i.e. to protect user data from being read by an attacker that gains + access to disks on which object data is stored. + + This feature is not intended to prevent undetectable `modification` + of user data at rest. + + This feature is not intended to protect against an attacker that gains + access to Swift's internal network connections, or gains access to key + material or is able to modify the Swift code running on Swift nodes. + +.. 
_encryption_deployment: + +------------------------ +Deployment and operation +------------------------ + +Encryption is deployed by adding two middleware filters to the proxy +server WSGI pipeline and including their respective filter configuration +sections in the `proxy-server.conf` file. :ref:`Additional steps +` are required if the container sync feature is +being used. + +The `keymaster` and `encryption` middleware filters must be to the right of all +other middleware in the pipeline apart from the final proxy-logging middleware, +and in the order shown in this example:: + + keymaster encryption proxy-logging proxy-server + + [filter:keymaster] + use = egg:swift#keymaster + encryption_root_secret = your_secret + + [filter:encryption] + use = egg:swift#encryption + # disable_encryption = False + +See the `proxy-server.conf-sample` file for further details on the middleware +configuration options. + +Keymaster middleware +-------------------- + +The `keymaster` middleware must be configured with a root secret before it is +used. By default the `keymaster` middleware will use the root secret configured +using the ``encryption_root_secret`` option in the middleware filter section of +the `proxy-server.conf` file, for example:: + + [filter:keymaster] + use = egg:swift#keymaster + encryption_root_secret = your_secret + +Root secret values MUST be at least 44 valid base-64 characters and +should be consistent across all proxy servers. The minimum length of 44 has +been chosen because it is the length of a base-64 encoded 32 byte value. + +.. note:: + + The ``encryption_root_secret`` option holds the master secret key used for + encryption. The security of all encrypted data critically depends on this + key and it should therefore be set to a high-entropy value. For example, a + suitable ``encryption_root_secret`` may be obtained by base-64 encoding a + 32 byte (or longer) value generated by a cryptographically secure random + number generator. + + The ``encryption_root_secret`` value is necessary to recover any encrypted + data from the storage system, and therefore, it must be guarded against + accidental loss. Its value (and consequently, the proxy-server.conf file) + should not be stored on any disk that is in any account, container or + object ring. + + The ``encryption_root_secret`` value should not be changed once deployed. + Doing so would prevent Swift from properly decrypting data that was + encrypted using the former value, and would therefore result in the loss of + that data. + +One method for generating a suitable value for ``encryption_root_secret`` is to +use the ``openssl`` command line tool:: + + openssl rand -base64 32 + + +Separate keymaster configuration file +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +The ``encryption_root_secret`` option may alternatively be specified in a +separate config file at a path specified by the ``keymaster_config_path`` +option, for example:: + + [filter:keymaster] + use = egg:swift#keymaster + keymaster_config_path = /etc/swift/keymaster.conf + +This has the advantage of allowing multiple processes which need to be +encryption-aware (for example, proxy-server and container-sync) to share the +same config file, ensuring that consistent encryption keys are used by those +processes. It also allows the keymaster configuration file to have different +permissions than the `proxy-server.conf` file. 
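+
+Whichever file ends up holding it, the root secret itself must still meet the
+length requirement described above. As a rough Python equivalent of the
+``openssl`` command, a suitable value can be generated and sanity-checked like
+this::
+
+    import base64
+    import secrets
+
+    # 32 random bytes encode to 44 base-64 characters, the documented minimum
+    root_secret = base64.b64encode(secrets.token_bytes(32)).decode('ascii')
+    assert len(root_secret) >= 44
+    print('encryption_root_secret = %s' % root_secret)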
+ +A separate keymaster config file should have a ``[keymaster]`` section +containing the ``encryption_root_secret`` option:: + + [keymaster] + encryption_root_secret = your_secret + + +.. note:: + + Alternative keymaster middleware is available to retrieve encryption root + secrets from an :ref:`external key management system + ` such as `Barbican + `_ rather than storing root secrets in + configuration files. + +Once deployed, the encryption filter will by default encrypt object data and +metadata when handling PUT and POST requests and decrypt object data and +metadata when handling GET and HEAD requests. COPY requests are transformed +into GET and PUT requests by the :ref:`copy` middleware before reaching the +encryption middleware and as a result object data and metadata is decrypted and +re-encrypted when copied. + +.. _changing_the_root_secret: + +Changing the encryption root secret +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +From time to time it may be desirable to change the root secret that is used to +derive encryption keys for new data written to the cluster. The `keymaster` +middleware allows alternative root secrets to be specified in its configuration +using options of the form:: + + encryption_root_secret_ = + +where ``secret_id`` is a unique identifier for the root secret and ``secret +value`` is a value that meets the requirements for a root secret described +above. + +Only one root secret is used to encrypt new data at any moment in time. This +root secret is specified using the ``active_root_secret_id`` option. If +specified, the value of this option should be one of the configured root secret +``secret_id`` values; otherwise the value of ``encryption_root_secret`` will be +taken as the default active root secret. + +.. note:: + + The active root secret is only used to derive keys for new data written to + the cluster. Changing the active root secret does not cause any existing + data to be re-encrypted. + +Existing encrypted data will be decrypted using the root secret that was active +when that data was written. All previous active root secrets must therefore +remain in the middleware configuration in order for decryption of existing data +to succeed. Existing encrypted data will reference previous root secret by +the ``secret_id`` so it must be kept consistent in the configuration. + +.. note:: + + Do not remove or change any previously active ```` or ````. + +For example, the following keymaster configuration file specifies three root +secrets, with the value of ``encryption_root_secret_2`` being the current +active root secret:: + + [keymaster] + active_root_secret_id = 2 + encryption_root_secret = your_secret + encryption_root_secret_1 = your_secret_1 + encryption_root_secret_2 = your_secret_2 + +.. note:: + + To ensure there is no loss of data availability, deploying a new key to + your cluster requires a two-stage config change. First, add the new key + to the ``encryption_root_secret_`` option and restart the + proxy-server. Do this for all proxies. Next, set the + ``active_root_secret_id`` option to the new secret id and restart the + proxy. Again, do this for all proxies. This process ensures that all + proxies will have the new key available for *decryption* before any proxy + uses it for *encryption*. + +Encryption middleware +--------------------- + +Once deployed, the encryption filter will by default encrypt object data and +metadata when handling PUT and POST requests and decrypt object data and +metadata when handling GET and HEAD requests. 
COPY requests are transformed +into GET and PUT requests by the :ref:`copy` middleware before reaching the +encryption middleware and as a result object data and metadata is decrypted and +re-encrypted when copied. + + +.. _encryption_root_secret_in_external_kms: + +Encryption Root Secret in External Key Management System +-------------------------------------------------------- + +The benefits of using a dedicated system for storing the encryption root secret +include the auditing and access control infrastructure that are already in +place in such a system, and the fact that an encryption root secret stored in a +key management system (KMS) may be backed by a hardware security module (HSM) +for additional security. Another significant benefit of storing the root +encryption secret in an external KMS is that it is in this case never stored on +a disk in the Swift cluster. + +Swift supports fetching encryption root secrets from a `Barbican +`_ service or a KMIP_ service using the +``kms_keymaster`` or ``kmip_keymaster`` middleware respectively. + +.. _KMIP: https://www.oasis-open.org/committees/kmip/ + +Encryption Root Secret in a Barbican KMS +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +Make sure the required dependencies are installed for retrieving an encryption +root secret from an external KMS. This can be done when installing Swift (add +the ``-e`` flag to install as a development version) by changing to the Swift +directory and running the following command to install Swift together with +the ``kms_keymaster`` extra dependencies:: + + sudo pip install .[kms_keymaster] + +Another way to install the dependencies is by making sure the +following lines exist in the requirements.txt file, and installing them using +``pip install -r requirements.txt``:: + + cryptography>=1.6 # BSD/Apache-2.0 + castellan>=0.6.0 + +.. note:: + + If any of the required packages is already installed, the ``--upgrade`` + flag may be required for the ``pip`` commands in order for the required + minimum version to be installed. + +To make use of an encryption root secret stored in an external KMS, +replace the keymaster middleware with the kms_keymaster middleware in the +proxy server WSGI pipeline in `proxy-server.conf`, in the order shown in this +example:: + + kms_keymaster encryption proxy-logging proxy-server + +and add a section to the same file:: + + [filter:kms_keymaster] + use = egg:swift#kms_keymaster + keymaster_config_path = file_with_kms_keymaster_config + +Create or edit the file `file_with_kms_keymaster_config` referenced above. +For further details on the middleware configuration options, see the +`keymaster.conf-sample` file. An example of the content of this file, with +optional parameters omitted, is below:: + + [kms_keymaster] + key_id = changeme + username = swift + password = password + project_name = swift + auth_endpoint = http://keystonehost:5000/v3 + +The encryption root secret shall be created and stored in the external key +management system before it can be used by the keymaster. It shall be stored +as a symmetric key, with content type ``application/octet-stream``, +``base64`` content encoding, ``AES`` algorithm, bit length ``256``, and secret +type ``symmetric``. The mode ``ctr`` may also be stored for informational +purposes - it is not currently checked by the keymaster. 
+ +The following command can be used to store the currently configured +``encryption_root_secret`` value from the `proxy-server.conf` file +in Barbican:: + + openstack secret store --name swift_root_secret \ + --payload-content-type="application/octet-stream" \ + --payload-content-encoding="base64" --algorithm aes --bit-length 256 \ + --mode ctr --secret-type symmetric --payload + +Alternatively, the existing root secret can also be stored in Barbican using +`curl `__. + +.. note:: + + The credentials used to store the secret in Barbican shall be the same + ones that the proxy server uses to retrieve the secret, i.e., the ones + configured in the `keymaster.conf` file. For clarity reasons the commands + shown here omit the credentials - they may be specified explicitly, or in + environment variables. + +Instead of using an existing root secret, Barbican can also be asked to +generate a new 256-bit root secret, with content type +``application/octet-stream`` and algorithm ``AES`` (the ``mode`` parameter is +currently optional):: + + openstack secret order create --name swift_root_secret \ + --payload-content-type="application/octet-stream" --algorithm aes \ + --bit-length 256 --mode ctr key + +The ``order create`` creates an asynchronous request to create the actual +secret. +The order can be retrieved using ``openstack secret order get``, and once the +order completes successfully, the output will show the key id of the generated +root secret. +Keys currently stored in Barbican can be listed using the +``openstack secret list`` command. + +.. note:: + + Both the order (the asynchronous request for creating or storing a secret), + and the actual secret itself, have similar unique identifiers. Once the + order has been completed, the key id is shown in the output of the ``order + get`` command. + +The keymaster uses the explicitly configured username and password (and +project name etc.) from the `keymaster.conf` file for retrieving the encryption +root secret from an external key management system. The `Castellan library +`_ is used to communicate with +Barbican. + +For the proxy server, reading the encryption root secret directly from the +`proxy-server.conf` file, from the `keymaster.conf` file pointed to +from the `proxy-server.conf` file, or from an external key management system +such as Barbican, are all functionally equivalent. In case reading the +encryption root secret from the external key management system fails, the +proxy server will not start up. If the encryption root secret is retrieved +successfully, it is cached in memory in the proxy server. + +For further details on the configuration options, see the +`[filter:kms_keymaster]` section in the `proxy-server.conf-sample` file, and +the `keymaster.conf-sample` file. + + +Encryption Root Secret in a KMIP service +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +This middleware enables Swift to fetch a root secret from a KMIP_ service. The +root secret is expected to have been previously created in the KMIP_ service +and is referenced by its unique identifier. The secret should be an AES-256 +symmetric key. + +To use this middleware Swift must be installed with the extra required +dependencies:: + + sudo pip install .[kmip_keymaster] + +Add the ``-e`` flag to install as a development version. 
+
+Edit the swift `proxy-server.conf` file to insert the middleware in the WSGI
+pipeline, replacing any other keymaster middleware::
+
+    [pipeline:main]
+    pipeline = catch_errors gatekeeper healthcheck proxy-logging \
+        kmip_keymaster encryption proxy-logging proxy-server
+
+and add a new filter section::
+
+    [filter:kmip_keymaster]
+    use = egg:swift#kmip_keymaster
+    key_id =
+    host =
+    port =
+    certfile = /path/to/client/cert.pem
+    keyfile = /path/to/client/key.pem
+    ca_certs = /path/to/server/cert.pem
+    username =
+    password =
+
+Apart from ``use`` and ``key_id`` the options are as defined for a PyKMIP
+client. The authoritative definition of these options can be found at
+``_.
+
+The value of the ``key_id`` option should be the unique identifier for a secret
+that will be retrieved from the KMIP_ service.
+
+The keymaster configuration can alternatively be defined in a separate config
+file by using the ``keymaster_config_path`` option::
+
+    [filter:kmip_keymaster]
+    use = egg:swift#kmip_keymaster
+    keymaster_config_path = /etc/swift/kmip_keymaster.conf
+
+In this case, the ``filter:kmip_keymaster`` section should contain no other
+options than ``use`` and ``keymaster_config_path``. All other options should be
+defined in the separate config file in a section named ``kmip_keymaster``. For
+example::
+
+    [kmip_keymaster]
+    key_id = 1234567890
+    host = 127.0.0.1
+    port = 5696
+    certfile = /etc/swift/kmip_client.crt
+    keyfile = /etc/swift/kmip_client.key
+    ca_certs = /etc/swift/kmip_server.crt
+    username = swift
+    password = swift_password
+
+Changing the encryption root secret of external KMSs
+^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+
+Because the KMS and KMIP keymasters derive from the default KeyMaster they
+also have the ability to define multiple keys. The only difference is the key
+option names. Instead of using the form `encryption_root_secret_`
+both external KMSs use `key_id_`, as it is an extension of their
+existing configuration. For example::
+
+    ...
+    key_id = 1234567890
+    key_id_foo = 0987654321
+    key_id_bar = 5432106789
+    active_root_secret_id = foo
+    ...
+
+Other than that, the process is the same as :ref:`changing_the_root_secret`.
+
+Upgrade Considerations
+----------------------
+
+When upgrading an existing cluster to deploy encryption, the following sequence
+of steps is recommended:
+
+#. Upgrade all object servers
+#. Upgrade all proxy servers
+#. Add keymaster and encryption middlewares to every proxy server's middleware
+   pipeline with the encryption ``disable_encryption`` option set to ``True``
+   and the keymaster ``encryption_root_secret`` value set as described above.
+#. If required, follow the steps for :ref:`container_sync_client_config`.
+#. Finally, change the encryption ``disable_encryption`` option to ``False``
+
+Objects that existed in the cluster prior to the keymaster and encryption
+middlewares being deployed are still readable with GET and HEAD requests. The
+content of those objects will not be encrypted unless they are written again by
+a PUT or COPY request. Any user metadata of those objects will not be encrypted
+unless it is written again by a PUT, POST or COPY request.
+
+Disabling Encryption
+--------------------
+
+Once deployed, the keymaster and encryption middlewares should not be removed
+from the pipeline. Doing so will cause encrypted object data and/or metadata to
+be returned in response to GET or HEAD requests for objects that were
+previously encrypted.
+ +Encryption of inbound object data may be disabled by setting the encryption +``disable_encryption`` option to ``True``, in which case existing encrypted +objects will remain encrypted but new data written with PUT, POST or COPY +requests will not be encrypted. The keymaster and encryption middlewares should +remain in the pipeline even when encryption of new objects is not required. The +encryption middleware is needed to handle GET requests for objects that may +have been previously encrypted. The keymaster is needed to provide keys for +those requests. + +.. _container_sync_client_config: + +Container sync configuration +---------------------------- + +If container sync is being used then the keymaster and encryption middlewares +must be added to the container sync internal client pipeline. The following +configuration steps are required: + +#. Create a custom internal client configuration file for container sync (if + one is not already in use) based on the sample file + `internal-client.conf-sample`. For example, copy + `internal-client.conf-sample` to `/etc/swift/container-sync-client.conf`. +#. Modify this file to include the middlewares in the pipeline in + the same way as described above for the proxy server. +#. Modify the container-sync section of all container server config files to + point to this internal client config file using the + ``internal_client_conf_path`` option. For example:: + + internal_client_conf_path = /etc/swift/container-sync-client.conf + +.. note:: + + The ``encryption_root_secret`` value is necessary to recover any encrypted + data from the storage system, and therefore, it must be guarded against + accidental loss. Its value (and consequently, the custom internal client + configuration file) should not be stored on any disk that is in any + account, container or object ring. + +.. note:: + + These container sync configuration steps will be necessary for container + sync probe tests to pass if the encryption middlewares are included in the + proxy pipeline of a test cluster. + +-------------- +Implementation +-------------- + +Encryption scheme +----------------- + +Plaintext data is encrypted to ciphertext using the AES cipher with 256-bit +keys implemented by the python `cryptography package +`_. The cipher is used in counter +(CTR) mode so that any byte or range of bytes in the ciphertext may be +decrypted independently of any other bytes in the ciphertext. This enables very +simple handling of ranged GETs. + +In general an item of unencrypted data, ``plaintext``, is transformed to an +item of encrypted data, ``ciphertext``:: + + ciphertext = E(plaintext, k, iv) + +where ``E`` is the encryption function, ``k`` is an encryption key and ``iv`` +is a unique initialization vector (IV) chosen for each encryption context. For +example, the object body is one encryption context with a randomly chosen IV. +The IV is stored as metadata of the encrypted item so that it is available for +decryption:: + + plaintext = D(ciphertext, k, iv) + +where ``D`` is the decryption function. + +The implementation of CTR mode follows `NIST SP800-38A +`_, and the +full IV passed to the encryption or decryption function serves as the initial +counter block. 
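+
+As an illustration (not a copy of Swift's internal code), the same CTR-mode
+construction can be reproduced with the ``cryptography`` package, using the
+16-byte IV directly as the initial counter block::
+
+    import os
+
+    from cryptography.hazmat.backends import default_backend
+    from cryptography.hazmat.primitives.ciphers import Cipher, algorithms, modes
+
+    key = os.urandom(32)   # a 256-bit AES key, standing in for an object key
+    iv = os.urandom(16)    # unique IV; also serves as the initial counter block
+
+    encryptor = Cipher(algorithms.AES(key), modes.CTR(iv),
+                       backend=default_backend()).encryptor()
+    ciphertext = encryptor.update(b'plaintext object data') + encryptor.finalize()
+
+    decryptor = Cipher(algorithms.AES(key), modes.CTR(iv),
+                       backend=default_backend()).decryptor()
+    assert decryptor.update(ciphertext) + decryptor.finalize() == \
+        b'plaintext object data'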
+ +In general any encrypted item has accompanying crypto-metadata that describes +the IV and the cipher algorithm used for the encryption:: + + crypto_metadata = {"iv": <16 byte value>, + "cipher": "AES_CTR_256"} + +This crypto-metadata is stored either with the ciphertext (for user +metadata and etags) or as a separate header (for object bodies). + +Key management +-------------- + +A keymaster middleware is responsible for providing the keys required for each +encryption and decryption operation. Two keys are required when handling object +requests: a `container key` that is uniquely associated with the container path +and an `object key` that is uniquely associated with the object path. These +keys are made available to the encryption middleware via a callback function +that the keymaster installs in the WSGI request environ. + +The current keymaster implementation derives container and object keys from the +``encryption_root_secret`` in a deterministic way by constructing a SHA256 +HMAC using the ``encryption_root_secret`` as a key and the container or object +path as a message, for example:: + + object_key = HMAC(encryption_root_secret, "/a/c/o") + +Other strategies for providing object and container keys may be employed by +future implementations of alternative keymaster middleware. + +During each object PUT, a random key is generated to encrypt the object body. +This random key is then encrypted using the object key provided by the +keymaster. This makes it safe to store the encrypted random key alongside the +encrypted object data and metadata. + +This process of `key wrapping` enables more efficient re-keying events when the +object key may need to be replaced and consequently any data encrypted using +that key must be re-encrypted. Key wrapping minimizes the amount of data +encrypted using those keys to just other randomly chosen keys which can be +re-wrapped efficiently without needing to re-encrypt the larger amounts of data +that were encrypted using the random keys. + +.. note:: + + Re-keying is not currently implemented. Key wrapping is implemented + in anticipation of future re-keying operations. + + +Encryption middleware +--------------------- + +The encryption middleware is composed of an `encrypter` component and a +`decrypter` component. + +Encrypter operation +^^^^^^^^^^^^^^^^^^^ + +Custom user metadata +++++++++++++++++++++ + +The encrypter encrypts each item of custom user metadata using the object key +provided by the keymaster and an IV that is randomly chosen for that metadata +item. The encrypted values are stored as :ref:`transient_sysmeta` with +associated crypto-metadata appended to the encrypted value. For example:: + + X-Object-Meta-Private1: value1 + X-Object-Meta-Private2: value2 + +are transformed to:: + + X-Object-Transient-Sysmeta-Crypto-Meta-Private1: + E(value1, object_key, header_iv_1); swift_meta={"iv": header_iv_1, + "cipher": "AES_CTR_256"} + X-Object-Transient-Sysmeta-Crypto-Meta-Private2: + E(value2, object_key, header_iv_2); swift_meta={"iv": header_iv_2, + "cipher": "AES_CTR_256"} + +The unencrypted custom user metadata headers are removed. 
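+
+A condensed sketch of the two steps described above -- deriving an object key
+from the root secret and the object path, then encrypting one user metadata
+value -- might look like the following; the helper names are illustrative and
+not part of Swift::
+
+    import base64
+    import hashlib
+    import hmac
+    import json
+    import os
+
+    from cryptography.hazmat.backends import default_backend
+    from cryptography.hazmat.primitives.ciphers import Cipher, algorithms, modes
+
+    root_secret = os.urandom(32)  # placeholder for the decoded root secret
+
+    def derive_key(path):
+        # object_key = HMAC(encryption_root_secret, "/a/c/o")
+        return hmac.new(root_secret, path.encode('utf8'), hashlib.sha256).digest()
+
+    def encrypt_value(value, key):
+        iv = os.urandom(16)
+        encryptor = Cipher(algorithms.AES(key), modes.CTR(iv),
+                           backend=default_backend()).encryptor()
+        ciphertext = encryptor.update(value.encode('utf8')) + encryptor.finalize()
+        crypto_meta = {'iv': base64.b64encode(iv).decode('ascii'),
+                       'cipher': 'AES_CTR_256'}
+        return '%s; swift_meta=%s' % (
+            base64.b64encode(ciphertext).decode('ascii'), json.dumps(crypto_meta))
+
+    object_key = derive_key('/AUTH_test/container1/object1')
+    print(encrypt_value('value1', object_key))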
+ +Object body ++++++++++++ + +Encryption of an object body is performed using a randomly chosen body key +and a randomly chosen IV:: + + body_ciphertext = E(body_plaintext, body_key, body_iv) + +The body_key is wrapped using the object key provided by the keymaster and a +randomly chosen IV:: + + wrapped_body_key = E(body_key, object_key, body_key_iv) + +The encrypter stores the associated crypto-metadata in a system metadata +header:: + + X-Object-Sysmeta-Crypto-Body-Meta: + {"iv": body_iv, + "cipher": "AES_CTR_256", + "body_key": {"key": wrapped_body_key, + "iv": body_key_iv}} + +Note that in this case there is an extra item of crypto-metadata which stores +the wrapped body key and its IV. + +Entity tag +++++++++++ + +While encrypting the object body the encrypter also calculates the ETag (md5 +digest) of the plaintext body. This value is encrypted using the object key +provided by the keymaster and a randomly chosen IV, and saved as an item of +system metadata, with associated crypto-metadata appended to the encrypted +value:: + + X-Object-Sysmeta-Crypto-Etag: + E(md5(plaintext), object_key, etag_iv); swift_meta={"iv": etag_iv, + "cipher": "AES_CTR_256"} + +The encrypter also forces an encrypted version of the plaintext ETag to be sent +with container updates by adding an update override header to the PUT request. +The associated crypto-metadata is appended to the encrypted ETag value of this +update override header:: + + X-Object-Sysmeta-Container-Update-Override-Etag: + E(md5(plaintext), container_key, override_etag_iv); + meta={"iv": override_etag_iv, "cipher": "AES_CTR_256"} + +The container key is used for this encryption so that the decrypter is able +to decrypt the ETags in container listings when handling a container request, +since object keys may not be available in that context. + +Since the plaintext ETag value is only known once the encrypter has completed +processing the entire object body, the ``X-Object-Sysmeta-Crypto-Etag`` and +``X-Object-Sysmeta-Container-Update-Override-Etag`` headers are sent after the +encrypted object body using the proxy server's support for request footers. + +.. _conditional_requests: + +Conditional Requests +++++++++++++++++++++ + +In general, an object server evaluates conditional requests with +``If[-None]-Match`` headers by comparing values listed in an +``If[-None]-Match`` header against the ETag that is stored in the object +metadata. This is not possible when the ETag stored in object metadata has been +encrypted. The encrypter therefore calculates an HMAC using the object key and +the ETag while handling object PUT requests, and stores this under the metadata +key ``X-Object-Sysmeta-Crypto-Etag-Mac``:: + + X-Object-Sysmeta-Crypto-Etag-Mac: HMAC(object_key, md5(plaintext)) + +Like other ETag-related metadata, this is sent after the encrypted object body +using the proxy server's support for request footers. + +The encrypter similarly calculates an HMAC for each ETag value included in +``If[-None]-Match`` headers of conditional GET or HEAD requests, and appends +these to the ``If[-None]-Match`` header. The encrypter also sets the +``X-Backend-Etag-Is-At`` header to point to the previously stored +``X-Object-Sysmeta-Crypto-Etag-Mac`` metadata so that the object server +evaluates the conditional request by comparing the HMAC values included in the +``If[-None]-Match`` with the value stored under +``X-Object-Sysmeta-Crypto-Etag-Mac``. 
For example, given a conditional request +with header:: + + If-Match: match_etag + +the encrypter would transform the request headers to include:: + + If-Match: match_etag,HMAC(object_key, match_etag) + X-Backend-Etag-Is-At: X-Object-Sysmeta-Crypto-Etag-Mac + +This enables the object server to perform an encrypted comparison to check +whether the ETags match, without leaking the ETag itself or leaking information +about the object body. + +Decrypter operation +^^^^^^^^^^^^^^^^^^^ + +For each GET or HEAD request to an object, the decrypter inspects the response +for encrypted items (revealed by crypto-metadata headers), and if any are +discovered then it will: + +#. Fetch the object and container keys from the keymaster via its callback +#. Decrypt the ``X-Object-Sysmeta-Crypto-Etag`` value +#. Decrypt the ``X-Object-Sysmeta-Container-Update-Override-Etag`` value +#. Decrypt metadata header values using the object key +#. Decrypt the wrapped body key found in ``X-Object-Sysmeta-Crypto-Body-Meta`` +#. Decrypt the body using the body key + +For each GET request to a container that would include ETags in its response +body, the decrypter will: + +#. GET the response body with the container listing +#. Fetch the container key from the keymaster via its callback +#. Decrypt any encrypted ETag entries in the container listing using the + container key + + +Impact on other Swift services and features +------------------------------------------- + +Encryption has no impact on :ref:`versioned_writes` other than that any +previously unencrypted objects will be encrypted as they are copied to or from +the versions container. Keymaster and encryption middlewares should be placed +after ``versioned_writes`` in the proxy server pipeline, as described in +:ref:`encryption_deployment`. + +`Container Sync` uses an internal client to GET objects that are to be sync'd. +This internal client must be configured to use the keymaster and encryption +middlewares as described :ref:`above `. + +Encryption has no impact on the `object-auditor` service. Since the ETag +header saved with the object at rest is the md5 sum of the encrypted object +body then the auditor will verify that encrypted data is valid. + +Encryption has no impact on the `object-expirer` service. ``X-Delete-At`` and +``X-Delete-After`` headers are not encrypted. + +Encryption has no impact on the `object-replicator` and `object-reconstructor` +services. These services are unaware of the object or EC fragment data being +encrypted. + +Encryption has no impact on the `container-reconciler` service. The +`container-reconciler` uses an internal client to move objects between +different policy rings. The reconciler's pipeline *MUST NOT* have encryption +enabled. The destination object has the same URL as the source object and the +object is moved without re-encryption. + + +Considerations for developers +----------------------------- + +Developers should be aware that keymaster and encryption middlewares rely on +the path of an object remaining unchanged. The included keymaster derives keys +for containers and objects based on their paths and the +``encryption_root_secret``. The keymaster does not rely on object metadata to +inform its generation of keys for GET and HEAD requests because when handling +:ref:`conditional_requests` it is required to provide the object key before any +metadata has been read from the object. 
+ +Developers should therefore give careful consideration to any new features that +would relocate object data and metadata within a Swift cluster by means that do +not cause the object data and metadata to pass through the encryption +middlewares in the proxy pipeline and be re-encrypted. + +The crypto-metadata associated with each encrypted item does include some +`key_id` metadata that is provided by the keymaster and contains the path used +to derive keys. This `key_id` metadata is persisted in anticipation of future +scenarios when it may be necessary to decrypt an object that has been relocated +without re-encrypting, in which case the metadata could be used to derive the +keys that were used for encryption. However, this alone is not sufficient to +handle conditional requests and to decrypt container listings where objects +have been relocated, and further work will be required to solve those issues. diff --git a/doc/source/overview_erasure_code.rst b/doc/source/overview_erasure_code.rst new file mode 100644 index 0000000000..26cf7aa828 --- /dev/null +++ b/doc/source/overview_erasure_code.rst @@ -0,0 +1,921 @@ +==================== +Erasure Code Support +==================== + +******************************* +History and Theory of Operation +******************************* + +There's a lot of good material out there on Erasure Code (EC) theory, this short +introduction is just meant to provide some basic context to help the reader +better understand the implementation in Swift. + +Erasure Coding for storage applications grew out of Coding Theory as far back as +the 1960s with the Reed-Solomon codes. These codes have been used for years in +applications ranging from CDs to DVDs to general communications and, yes, even +in the space program starting with Voyager! The basic idea is that some amount +of data is broken up into smaller pieces called fragments and coded in such a +way that it can be transmitted with the ability to tolerate the loss of some +number of the coded fragments. That's where the word "erasure" comes in, if you +transmit 14 fragments and only 13 are received then one of them is said to be +"erased". The word "erasure" provides an important distinction with EC; it +isn't about detecting errors, it's about dealing with failures. Another +important element of EC is that the number of erasures that can be tolerated can +be adjusted to meet the needs of the application. + +At a high level EC works by using a specific scheme to break up a single data +buffer into several smaller data buffers then, depending on the scheme, +performing some encoding operation on that data in order to generate additional +information. So you end up with more data than you started with and that extra +data is often called "parity". Note that there are many, many different +encoding techniques that vary both in how they organize and manipulate the data +as well by what means they use to calculate parity. For example, one scheme +might rely on `Galois Field Arithmetic `_ while others may work with only XOR. The number of variations and +details about their differences are well beyond the scope of this introduction, +but we will talk more about a few of them when we get into the implementation of +EC in Swift. + +Overview of EC Support in Swift +================================ + +First and foremost, from an application perspective EC support is totally +transparent. 
There are no EC related external API; a container is simply created +using a Storage Policy defined to use EC and then interaction with the cluster +is the same as any other durability policy. + +EC is implemented in Swift as a Storage Policy, see :doc:`overview_policies` for +complete details on Storage Policies. Because support is implemented as a +Storage Policy, all of the storage devices associated with your cluster's EC +capability can be isolated. It is entirely possible to share devices between +storage policies, but for EC it may make more sense to not only use separate +devices but possibly even entire nodes dedicated for EC. + +Which direction one chooses depends on why the EC policy is being deployed. If, +for example, there is a production replication policy in place already and the +goal is to add a cold storage tier such that the existing nodes performing +replication are impacted as little as possible, adding a new set of nodes +dedicated to EC might make the most sense but also incurs the most cost. On the +other hand, if EC is being added as a capability to provide additional +durability for a specific set of applications and the existing infrastructure is +well suited for EC (sufficient number of nodes, zones for the EC scheme that is +chosen) then leveraging the existing infrastructure such that the EC ring shares +nodes with the replication ring makes the most sense. These are some of the +main considerations: + +* Layout of existing infrastructure. +* Cost of adding dedicated EC nodes (or just dedicated EC devices). +* Intended usage model(s). + +The Swift code base does not include any of the algorithms necessary to perform +the actual encoding and decoding of data; that is left to external libraries. +The Storage Policies architecture is leveraged to enable EC on a per container +basis -- the object rings are still used to determine the placement of EC data +fragments. Although there are several code paths that are unique to an operation +associated with an EC policy, an external dependency to an Erasure Code library +is what Swift counts on to perform the low level EC functions. The use of an +external library allows for maximum flexibility as there are a significant +number of options out there, each with its owns pros and cons that can vary +greatly from one use case to another. + +PyECLib: External Erasure Code Library +======================================= + +PyECLib is a Python Erasure Coding Library originally designed and written as +part of the effort to add EC support to the Swift project, however it is an +independent project. The library provides a well-defined and simple Python +interface and internally implements a plug-in architecture allowing it to take +advantage of many well-known C libraries such as: + +* Jerasure and GFComplete at http://jerasure.org. +* Intel(R) ISA-L at http://01.org/intel%C2%AE-storage-acceleration-library-open-source-version. +* Or write your own! + +PyECLib uses a C based library called liberasurecode to implement the plug in +infrastructure; liberasurecode is available at: + +* liberasurecode: https://github.com/openstack/liberasurecode + +PyECLib itself therefore allows for not only choice but further extensibility as +well. PyECLib also comes with a handy utility to help determine the best +algorithm to use based on the equipment that will be used (processors and server +configurations may vary in performance per algorithm). More on this will be +covered in the configuration section. 
PyECLib is included as a Swift +requirement. + +For complete details see `PyECLib `_ + +Storing and Retrieving Objects +============================== + +We will discuss the details of how PUT and GET work in the "Under the Hood" +section later on. The key point here is that all of the erasure code work goes +on behind the scenes; this summary is a high level information overview only. + +The PUT flow looks like this: + +#. The proxy server streams in an object and buffers up "a segment" of data + (size is configurable). +#. The proxy server calls on PyECLib to encode the data into smaller fragments. +#. The proxy streams the encoded fragments out to the storage nodes based on + ring locations. +#. Repeat until the client is done sending data. +#. The client is notified of completion when a quorum is met. + +The GET flow looks like this: + +#. The proxy server makes simultaneous requests to participating nodes. +#. As soon as the proxy has the fragments it needs, it calls on PyECLib to + decode the data. +#. The proxy streams the decoded data it has back to the client. +#. Repeat until the proxy is done sending data back to the client. + +It may sound like, from this high level overview, that using EC is going to +cause an explosion in the number of actual files stored in each node's local +file system. Although it is true that more files will be stored (because an +object is broken into pieces), the implementation works to minimize this where +possible, more details are available in the Under the Hood section. + +Handoff Nodes +============= + +In EC policies, similarly to replication, handoff nodes are a set of storage +nodes used to augment the list of primary nodes responsible for storing an +erasure coded object. These handoff nodes are used in the event that one or more +of the primaries are unavailable. Handoff nodes are still selected with an +attempt to achieve maximum separation of the data being placed. + +Reconstruction +============== + +For an EC policy, reconstruction is analogous to the process of replication for +a replication type policy -- essentially "the reconstructor" replaces "the +replicator" for EC policy types. The basic framework of reconstruction is very +similar to that of replication with a few notable exceptions: + +* Because EC does not actually replicate partitions, it needs to operate at a + finer granularity than what is provided with rsync, therefore EC leverages + much of ssync behind the scenes (you do not need to manually configure ssync). +* Once a pair of nodes has determined the need to replace a missing object + fragment, instead of pushing over a copy like replication would do, the + reconstructor has to read in enough surviving fragments from other nodes and + perform a local reconstruction before it has the correct data to push to the + other node. +* A reconstructor does not talk to all other reconstructors in the set of nodes + responsible for an EC partition, this would be far too chatty, instead each + reconstructor is responsible for sync'ing with the partition's closest two + neighbors (closest meaning left and right on the ring). + +.. note:: + + EC work (encode and decode) takes place both on the proxy nodes, for PUT/GET + operations, as well as on the storage nodes for reconstruction. As with + replication, reconstruction can be the result of rebalancing, bit-rot, drive + failure or reverting data from a hand-off node back to its primary. 
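+
+The encode and decode operations themselves are provided by PyECLib. As a
+standalone illustration (assuming PyECLib and the ``liberasurecode_rs_vand``
+backend are installed, and not showing the code path Swift itself uses), a
+10+4 scheme behaves like this::
+
+    import os
+
+    from pyeclib.ec_iface import ECDriver
+
+    # 10 data fragments + 4 parity fragments
+    ec_driver = ECDriver(k=10, m=4, ec_type='liberasurecode_rs_vand')
+
+    segment = os.urandom(1048576)          # one buffered segment
+    fragments = ec_driver.encode(segment)  # 14 fragments in total
+
+    # any 10 of the 14 fragments are sufficient to decode the segment
+    assert ec_driver.decode(fragments[:10]) == segment
+
+    # rebuild a "lost" fragment (index 3) from the surviving fragments
+    surviving = fragments[:3] + fragments[4:]
+    rebuilt = ec_driver.reconstruct(surviving, [3])
+    # the rebuilt fragment can be used for decoding just like the original
+    assert ec_driver.decode(surviving[:9] + rebuilt) == segment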
+ +************************** +Performance Considerations +************************** + +In general, EC has different performance characteristics than replicated data. +EC requires substantially more CPU to read and write data, and is more suited +for larger objects that are not frequently accessed (e.g. backups). + +Operators are encouraged to characterize the performance of various EC schemes +and share their observations with the developer community. + + +.. _using_ec_policy: + +**************************** +Using an Erasure Code Policy +**************************** + +To use an EC policy, the administrator simply needs to define an EC policy in +`swift.conf` and create/configure the associated object ring. An example of how +an EC policy can be setup is shown below:: + + [storage-policy:2] + name = ec104 + policy_type = erasure_coding + ec_type = liberasurecode_rs_vand + ec_num_data_fragments = 10 + ec_num_parity_fragments = 4 + ec_object_segment_size = 1048576 + +Let's take a closer look at each configuration parameter: + +* ``name``: This is a standard storage policy parameter. + See :doc:`overview_policies` for details. +* ``policy_type``: Set this to ``erasure_coding`` to indicate that this is an EC + policy. +* ``ec_type``: Set this value according to the available options in the selected + PyECLib back-end. This specifies the EC scheme that is to be used. For + example the option shown here selects Vandermonde Reed-Solomon encoding while + an option of ``flat_xor_hd_3`` would select Flat-XOR based HD combination + codes. See the `PyECLib `_ page for + full details. +* ``ec_num_data_fragments``: The total number of fragments that will be + comprised of data. +* ``ec_num_parity_fragments``: The total number of fragments that will be + comprised of parity. +* ``ec_object_segment_size``: The amount of data that will be buffered up before + feeding a segment into the encoder/decoder. The default value is 1048576. + +When PyECLib encodes an object, it will break it into N fragments. However, what +is important during configuration, is how many of those are data and how many +are parity. So in the example above, PyECLib will actually break an object in +14 different fragments, 10 of them will be made up of actual object data and 4 +of them will be made of parity data (calculations depending on ec_type). + +When deciding which devices to use in the EC policy's object ring, be sure to +carefully consider the performance impacts. Running some performance +benchmarking in a test environment for your configuration is highly recommended +before deployment. + +To create the EC policy's object ring, the only difference in the usage of the +``swift-ring-builder create`` command is the ``replicas`` parameter. The +``replicas`` value is the number of fragments spread across the object servers +associated with the ring; ``replicas`` must be equal to the sum of +``ec_num_data_fragments`` and ``ec_num_parity_fragments``. For example:: + + swift-ring-builder object-1.builder create 10 14 1 + +Note that in this example the ``replicas`` value of ``14`` is based on the sum of +``10`` EC data fragments and ``4`` EC parity fragments. + +Once you have configured your EC policy in `swift.conf` and created your object +ring, your application is ready to start using EC simply by creating a container +with the specified policy name and interacting as usual. + +.. 
note:: + + It's important to note that once you have deployed a policy and have created + objects with that policy, these configurations options cannot be changed. In + case a change in the configuration is desired, you must create a new policy + and migrate the data to a new container. + +.. warning:: + + Using ``isa_l_rs_vand`` with more than 4 parity fragments creates fragments + which may in some circumstances fail to reconstruct properly or (with + liberasurecode < 1.3.1) reconstruct corrupted data. New policies that need + large numbers of parity fragments should consider using ``isa_l_rs_cauchy``. + Any existing affected policies must be marked deprecated, and data in + containers with that policy should be migrated to a new policy. + +Migrating Between Policies +========================== + +A common usage of EC is to migrate less commonly accessed data from a more +expensive but lower latency policy such as replication. When an application +determines that it wants to move data from a replication policy to an EC policy, +it simply needs to move the data from the replicated container to an EC +container that was created with the target durability policy. + + +********* +Global EC +********* + +The following recommendations are made when deploying an EC policy that spans +multiple regions in a :doc:`Global Cluster `: + +* The global EC policy should use :ref:`ec_duplication` in conjunction with a + :ref:`Composite Ring `, as described below. +* Proxy servers should be :ref:`configured to use read affinity + ` to prefer reading from their local region for + the global EC policy. :ref:`proxy_server_per_policy_config` allows this to be + configured for individual policies. + +.. note:: + + Before deploying a Global EC policy, consideration should be given to the + :ref:`global_ec_known_issues`, in particular the relatively poor + performance anticipated from the object-reconstructor. + +.. _ec_duplication: + +EC Duplication +============== + +EC Duplication enables Swift to make duplicated copies of fragments of erasure +coded objects. If an EC storage policy is configured with a non-default +``ec_duplication_factor`` of ``N > 1``, then the policy will create ``N`` +duplicates of each unique fragment that is returned from the configured EC +engine. + +Duplication of EC fragments is optimal for Global EC storage policies, which +require dispersion of fragment data across failure domains. Without fragment +duplication, common EC parameters will not distribute enough unique fragments +between large failure domains to allow for a rebuild using fragments from any +one domain. For example a uniformly distributed ``10+4`` EC policy schema +would place 7 fragments in each of two failure domains, which is less in each +failure domain than the 10 fragments needed to rebuild a missing fragment. + +Without fragment duplication, an EC policy schema must be adjusted to include +additional parity fragments in order to guarantee the number of fragments in +each failure domain is greater than the number required to rebuild. For +example, a uniformly distributed ``10+18`` EC policy schema would place 14 +fragments in each of two failure domains, which is more than sufficient in each +failure domain to rebuild a missing fragment. However, empirical testing has +shown encoding a schema with ``num_parity > num_data`` (such as ``10+18``) is +less efficient than using duplication of fragments. 
EC fragment duplication +enables Swift's Global EC to maintain more independence between failure domains +without sacrificing efficiency on read/write or rebuild! + +The ``ec_duplication_factor`` option may be configured in `swift.conf` in each +``storage-policy`` section. The option may be omitted - the default value is +``1`` (i.e. no duplication):: + + [storage-policy:2] + name = ec104 + policy_type = erasure_coding + ec_type = liberasurecode_rs_vand + ec_num_data_fragments = 10 + ec_num_parity_fragments = 4 + ec_object_segment_size = 1048576 + ec_duplication_factor = 2 + +.. warning:: + + EC duplication is intended for use with Global EC policies. To ensure + independent availability of data in all regions, the + ``ec_duplication_factor`` option should only be used in conjunction with + :ref:`composite_rings`, as described in this document. + +In this example, a ``10+4`` schema and a duplication factor of ``2`` will +result in ``(10+4)x2 = 28`` fragments being stored (we will use the shorthand +``10+4x2`` to denote that policy configuration) . The ring for this policy +should be configured with 28 replicas (i.e. ``(ec_num_data_fragments + +ec_num_parity_fragments) * ec_duplication_factor``). A ``10+4x2`` schema +**can** allow a multi-region deployment to rebuild an object to full durability +even when *more* than 14 fragments are unavailable. This is advantageous with +respect to a ``10+18`` configuration not only because reads from data fragments +will be more common and more efficient, but also because a ``10+4x2`` can grow +into a ``10+4x3`` to expand into another region. + +EC duplication with composite rings +----------------------------------- + +It is recommended that EC Duplication is used with :ref:`composite_rings` in +order to disperse duplicate fragments across regions. + +When EC duplication is used, it is highly desirable to have one duplicate of +each fragment placed in each region. This ensures that a set of +``ec_num_data_fragments`` unique fragments (the minimum needed to reconstruct +an object) can always be assembled from a single region. This in turn means +that objects are robust in the event of an entire region becoming unavailable. + +This can be achieved by using a :ref:`composite ring ` with +the following properties: + +* The number of component rings in the composite ring is equal to the + ``ec_duplication_factor`` for the policy. +* Each *component* ring has a number of ``replicas`` that is equal to the sum + of ``ec_num_data_fragments`` and ``ec_num_parity_fragments``. +* Each component ring is populated with devices in a unique region. + +This arrangement results in each component ring in the composite ring, and +therefore each region, having one copy of each fragment. + +For example, consider a Swift cluster with two regions, ``region1`` and +``region2`` and a ``4+2x2`` EC policy schema. This policy should use a +composite ring with two component rings, ``ring1`` and ``ring2``, having +devices exclusively in regions ``region1`` and ``region2`` respectively. Each +component ring should have ``replicas = 6``. As a result, the first 6 +fragments for an object will always be placed in ``ring1`` (i.e. in +``region1``) and the second 6 duplicate fragments will always be placed in +``ring2`` (i.e. in ``region2``). 
+ +Conversely, a conventional ring spanning the two regions may give a suboptimal +distribution of duplicates across the regions; it is possible for duplicates of +the same fragment to be placed in the same region, and consequently for another +region to have no copies of that fragment. This may make it impossible to +assemble a set of ``ec_num_data_fragments`` unique fragments from a single +region. For example, the conventional ring could have a pathologically +sub-optimal placement such as:: + + r1 + #0#d.data + #0#d.data + #2#d.data + #2#d.data + #4#d.data + #4#d.data + r2 + #1#d.data + #1#d.data + #3#d.data + #3#d.data + #5#d.data + #5#d.data + +In this case, the object cannot be reconstructed from a single region; +``region1`` has only the fragments with index ``0, 2, 4`` and ``region2`` has +the other 3 indexes, but we need 4 unique indexes to be able to rebuild an +object. + +Node Selection Strategy for Reads +--------------------------------- + +Proxy servers require a set of *unique* fragment indexes to decode the original +object when handling a GET request to an EC policy. With a conventional EC +policy, this is very likely to be the outcome of reading fragments from a +random selection of backend nodes. With an EC Duplication policy it is +significantly more likely that responses from a *random* selection of backend +nodes might include some duplicated fragments. + +For this reason it is strongly recommended that EC Duplication always be +deployed in combination with :ref:`composite_rings` and :ref:`proxy server read +affinity `. + +Under normal conditions with the recommended deployment, read affinity will +cause a proxy server to first attempt to read fragments from nodes in its local +region. These fragments are guaranteed to be unique with respect to each other. +Even if there are a small number of local failures, unique local parity +fragments will make up the difference. However, should enough local primary +storage nodes fail, such that sufficient unique fragments are not available in +the local region, a global EC cluster will proceed to read fragments from the +other region(s). Random reads from the remote region are not guaranteed to +return unique fragments; with EC Duplication there is a significantly high +probability that the proxy server will encounter a fragment that is a duplicate +of one it has already found in the local region. The proxy server will ignore +these and make additional requests until it accumulates the required set of +unique fragments, potentially searching all the primary and handoff locations +in the local and remote regions before ultimately failing the read. + +A global EC deployment configured as recommended is therefore extremely +resilient. However, under extreme failure conditions read handling can be +inefficient because nodes in other regions are guaranteed to have some +fragments which are duplicates of those the proxy server has already received. +Work is in progress to improve the proxy server node selection strategy such +that when it is necessary to read from other regions, nodes that are likely to +have useful fragments are preferred over those that are likely to return a +duplicate. + +.. _global_ec_known_issues: + +Known Issues +============ + +Efficient Cross Region Rebuild +------------------------------ + +Work is also in progress to improve the object-reconstructor efficiency for +Global EC policies. Unlike the proxy server, the reconstructor does not apply +any read affinity settings when gathering fragments. 
It is therefore likely to +receive duplicated fragments (i.e. make wasted backend GET requests) while +performing *every* fragment reconstruction. + +Additionally, other reconstructor optimisations for Global EC are under +investigation: + +* Since fragments are duplicated between regions it may in some cases be more + attractive to restore failed fragments from their duplicates in another + region instead of rebuilding them from other fragments in the local region. + +* Conversely, to avoid WAN transfer it may be more attractive to rebuild + fragments from local parity. + +* During rebalance it will always be more attractive to revert a fragment from + it's old-primary to it's new primary rather than rebuilding or transferring a + duplicate from the remote region. + + +************** +Under the Hood +************** + +Now that we've explained a little about EC support in Swift and how to +configure and use it, let's explore how EC fits in at the nuts-n-bolts level. + +Terminology +=========== + +The term 'fragment' has been used already to describe the output of the EC +process (a series of fragments) however we need to define some other key terms +here before going any deeper. Without paying special attention to using the +correct terms consistently, it is very easy to get confused in a hurry! + +* **chunk**: HTTP chunks received over wire (term not used to describe any EC + specific operation). +* **segment**: Not to be confused with SLO/DLO use of the word, in EC we call a + segment a series of consecutive HTTP chunks buffered up before performing an + EC operation. +* **fragment**: Data and parity 'fragments' are generated when erasure coding + transformation is applied to a segment. +* **EC archive**: A concatenation of EC fragments; to a storage node this looks + like an object. +* **ec_ndata**: Number of EC data fragments. +* **ec_nparity**: Number of EC parity fragments. + +Middleware +========== + +Middleware remains unchanged. For most middleware (e.g., SLO/DLO) the fact that +the proxy is fragmenting incoming objects is transparent. For list endpoints, +however, it is a bit different. A caller of list endpoints will get back the +locations of all of the fragments. The caller will be unable to re-assemble the +original object with this information, however the node locations may still +prove to be useful information for some applications. + +On Disk Storage +=============== + +EC archives are stored on disk in their respective objects-N directory based on +their policy index. See :doc:`overview_policies` for details on per policy +directory information. + +In addition to the object timestamp, the filenames of EC archives encode other +information related to the archive: + +* The fragment archive index. This is required for a few reasons. For one, it + allows us to store fragment archives of different indexes on the same storage + node which is not typical however it is possible in many circumstances. + Without unique filenames for the different EC archive files in a set, we + would be at risk of overwriting one archive of index `n` with another of + index `m` in some scenarios. + + The index is appended to the filename just before the ``.data`` extension. + For example, the filename for a fragment archive storing the 5th fragment + would be:: + + 1418673556.92690#5.data + +* The durable state of the archive. 
The meaning of this will be described in + more detail later, but a fragment archive that is considered durable has an + additional ``#d`` string included in its filename immediately before the + ``.data`` extension. For example:: + + 1418673556.92690#5#d.data + +A policy-specific transformation function is therefore used to build the +archive filename. These functions are implemented in the diskfile module as +methods of policy specific sub classes of ``BaseDiskFileManager``. + +The transformation function for the replication policy is simply a NOP. + +.. note:: + + In older versions the durable state of an archive was represented by an + additional file called the ``.durable`` file instead of the ``#d`` + substring in the ``.data`` filename. The ``.durable`` for the example above + would be:: + + 1418673556.92690.durable + + +Proxy Server +============ + +High Level +---------- + +The Proxy Server handles Erasure Coding in a different manner than replication, +therefore there are several code paths unique to EC policies either though sub +classing or simple conditionals. Taking a closer look at the PUT and the GET +paths will help make this clearer. But first, a high level overview of how an +object flows through the system: + +.. image:: images/ec_overview.png + +Note how: + +* Incoming objects are buffered into segments at the proxy. +* Segments are erasure coded into fragments at the proxy. +* The proxy stripes fragments across participating nodes such that the on-disk + stored files that we call a fragment archive is appended with each new + fragment. + +This scheme makes it possible to minimize the number of on-disk files given our +segmenting and fragmenting. + +Multi_Phase Conversation +------------------------ + +Multi-part MIME document support is used to allow the proxy to engage in a +handshake conversation with the storage node for processing PUT requests. This +is required for a few different reasons. + +#. From the perspective of the storage node, a fragment archive is really just + another object, we need a mechanism to send down the original object etag + after all fragment archives have landed. +#. Without introducing strong consistency semantics, the proxy needs a mechanism + to know when a quorum of fragment archives have actually made it to disk + before it can inform the client of a successful PUT. + +MIME supports a conversation between the proxy and the storage nodes for every +PUT. This provides us with the ability to handle a PUT in one connection and +assure that we have the essence of a 2 phase commit, basically having the proxy +communicate back to the storage nodes once it has confirmation that a quorum of +fragment archives in the set have been written. + +For the first phase of the conversation the proxy requires a quorum of +`ec_ndata + 1` fragment archives to be successfully put to storage nodes. This +ensures that the object could still be reconstructed even if one of the +fragment archives becomes unavailable. As described above, each fragment +archive file is named:: + + #.data + +where ``ts`` is the timestamp and ``frag_index`` is the fragment archive index. + +During the second phase of the conversation the proxy communicates a +confirmation to storage nodes that the fragment archive quorum has been +achieved. 
This causes each storage node to rename the fragment archive written +in the first phase of the conversation to include the substring ``#d`` in its +name:: + + ##d.data + +This indicates to the object server that this fragment archive is `durable` and +that there is a set of data files that are durable at timestamp ``ts``. + +For the second phase of the conversation the proxy requires a quorum of +`ec_ndata + 1` successful commits on storage nodes. This ensures that there are +sufficient committed fragment archives for the object to be reconstructed even +if one becomes unavailable. The reconstructor ensures that the durable state is +replicated on storage nodes where it may be missing. + +Note that the completion of the commit phase of the conversation +is also a signal for the object server to go ahead and immediately delete older +timestamp files for this object. This is critical as we do not want to delete +the older object until the storage node has confirmation from the proxy, via the +multi-phase conversation, that the other nodes have landed enough for a quorum. + +The basic flow looks like this: + +#. The Proxy Server erasure codes and streams the object fragments + (ec_ndata + ec_nparity) to the storage nodes. +#. The storage nodes store objects as EC archives and upon finishing object + data/metadata write, send a 1st-phase response to proxy. +#. Upon quorum of storage nodes responses, the proxy initiates 2nd-phase by + sending commit confirmations to object servers. +#. Upon receipt of commit message, object servers rename ``.data`` files to + include the ``#d`` substring, indicating successful PUT, and send a final + response to the proxy server. +#. The proxy waits for `ec_ndata + 1` object servers to respond with a + success (2xx) status before responding to the client with a successful + status. + +Here is a high level example of what the conversation looks like:: + + proxy: PUT /p/a/c/o + Transfer-Encoding': 'chunked' + Expect': '100-continue' + X-Backend-Obj-Multiphase-Commit: yes + obj: 100 Continue + X-Obj-Multiphase-Commit: yes + proxy: --MIMEboundary + X-Document: object body + + --MIMEboundary + X-Document: object metadata + Content-MD5: + + --MIMEboundary + #.data file> + obj: 100 Continue + + proxy: X-Document: put commit + commit_confirmation + --MIMEboundary-- + #.data to ##d.data> + obj: 20x + =2 2xx responses> + proxy: 2xx -> client + +A few key points on the durable state of a fragment archive: + +* A durable fragment archive means that there exist sufficient other fragment + archives elsewhere in the cluster (durable and/or non-durable) to reconstruct + the object. +* When a proxy does a GET, it will require at least one object server to + respond with a fragment archive is durable before reconstructing and + returning the object to the client. + +Partial PUT Failures +-------------------- + +A partial PUT failure has a few different modes. In one scenario the Proxy +Server is alive through the entire PUT conversation. This is a very +straightforward case. The client will receive a good response if and only if a +quorum of fragment archives were successfully landed on their storage nodes. +In this case the Reconstructor will discover the missing fragment archives, +perform a reconstruction and deliver those fragment archives to their nodes. + +The more interesting case is what happens if the proxy dies in the middle of a +conversation. 
If it turns out that a quorum had been met and the commit phase +of the conversation finished, its as simple as the previous case in that the +reconstructor will repair things. However, if the commit didn't get a chance to +happen then some number of the storage nodes have .data files on them (fragment +archives) but none of them knows whether there are enough elsewhere for the +entire object to be reconstructed. In this case the client will not have +received a 2xx response so there is no issue there, however, it is left to the +storage nodes to clean up the stale fragment archives. Work is ongoing in this +area to enable the proxy to play a role in reviving these fragment archives, +however, for the current release, a proxy failure after the start of a +conversation but before the commit message will simply result in a PUT failure. + +GET +--- + +The GET for EC is different enough from replication that subclassing the +`BaseObjectController` to the `ECObjectController` enables an efficient way to +implement the high level steps described earlier: + +#. The proxy server makes simultaneous requests to `ec_ndata` primary object + server nodes with goal of finding a set of `ec_ndata` distinct EC archives + at the same timestamp, and an indication from at least one object server + that a durable fragment archive exists for that timestamp. If this goal is + not achieved with the first `ec_ndata` requests then the proxy server + continues to issue requests to the remaining primary nodes and then handoff + nodes. +#. As soon as the proxy server has found a usable set of `ec_ndata` EC + archives, it starts to call PyECLib to decode fragments as they are returned + by the object server nodes. +#. The proxy server creates Etag and content length headers for the client + response since each EC archive's metadata is valid only for that archive. +#. The proxy streams the decoded data it has back to the client. + +Note that the proxy does not require all objects servers to have a durable +fragment archive to return in response to a GET. The proxy will be satisfied if +just one object server has a durable fragment archive at the same timestamp as +EC archives returned from other object servers. This means that the proxy can +successfully GET an object that had missing durable state on some nodes when it +was PUT (i.e. a partial PUT failure occurred). + +Note also that an object server may inform the proxy server that it has more +than one EC archive for different timestamps and/or fragment indexes, which may +cause the proxy server to issue multiple requests for distinct EC archives to +that object server. (This situation can temporarily occur after a ring +rebalance when a handoff node storing an archive has become a primary node and +received its primary archive but not yet moved the handoff archive to its +primary node.) + +The proxy may receive EC archives having different timestamps, and may +receive several EC archives having the same index. The proxy therefore +ensures that it has sufficient EC archives with the same timestamp +and distinct fragment indexes before considering a GET to be successful. + +Object Server +============= + +The Object Server, like the Proxy Server, supports MIME conversations as +described in the proxy section earlier. This includes processing of the commit +message and decoding various sections of the MIME document to extract the footer +which includes things like the entire object etag. 
+ +DiskFile +-------- + +Erasure code policies use subclassed ``ECDiskFile``, ``ECDiskFileWriter``, +``ECDiskFileReader`` and ``ECDiskFileManager`` to implement EC specific +handling of on disk files. This includes things like file name manipulation to +include the fragment index and durable state in the filename, construction of +EC specific ``hashes.pkl`` file to include fragment index information, etc. + +Metadata +^^^^^^^^ + +There are few different categories of metadata that are associated with EC: + +System Metadata: EC has a set of object level system metadata that it +attaches to each of the EC archives. The metadata is for internal use only: + +* ``X-Object-Sysmeta-EC-Etag``: The Etag of the original object. +* ``X-Object-Sysmeta-EC-Content-Length``: The content length of the original + object. +* ``X-Object-Sysmeta-EC-Frag-Index``: The fragment index for the object. +* ``X-Object-Sysmeta-EC-Scheme``: Description of the EC policy used to encode + the object. +* ``X-Object-Sysmeta-EC-Segment-Size``: The segment size used for the object. + +User Metadata: User metadata is unaffected by EC, however, a full copy of the +user metadata is stored with every EC archive. This is required as the +reconstructor needs this information and each reconstructor only communicates +with its closest neighbors on the ring. + +PyECLib Metadata: PyECLib stores a small amount of metadata on a per fragment +basis. This metadata is not documented here as it is opaque to Swift. + +Database Updates +================ + +As account and container rings are not associated with a Storage Policy, there +is no change to how these database updates occur when using an EC policy. + +The Reconstructor +================= + +The Reconstructor performs analogous functions to the replicator: + +#. Recovering from disk drive failure. +#. Moving data around because of a rebalance. +#. Reverting data back to a primary from a handoff. +#. Recovering fragment archives from bit rot discovered by the auditor. + +However, under the hood it operates quite differently. The following are some +of the key elements in understanding how the reconstructor operates. + +Unlike the replicator, the work that the reconstructor does is not always as +easy to break down into the 2 basic tasks of synchronize or revert (move data +from handoff back to primary) because of the fact that one storage node can +house fragment archives of various indexes and each index really \"belongs\" to +a different node. So, whereas when the replicator is reverting data from a +handoff it has just one node to send its data to, the reconstructor can have +several. Additionally, it is not always the case that the processing of a +particular suffix directory means one or the other job type for the entire +directory (as it does for replication). The scenarios that create these mixed +situations can be pretty complex so we will just focus on what the +reconstructor does here and not a detailed explanation of why. + +Job Construction and Processing +------------------------------- + +Because of the nature of the work it has to do as described above, the +reconstructor builds jobs for a single job processor. The job itself contains +all of the information needed for the processor to execute the job which may be +a synchronization or a data reversion. There may be a mix of jobs that +perform both of these operations on the same suffix directory. + +Jobs are constructed on a per-partition basis and then per-fragment-index basis. 
+That is, there will be one job for every fragment index in a partition. +Performing this construction \"up front\" like this helps minimize the +interaction between nodes collecting hashes.pkl information. + +Once a set of jobs for a partition has been constructed, those jobs are sent off +to threads for execution. The single job processor then performs the necessary +actions, working closely with ssync to carry out its instructions. For data +reversion, the actual objects themselves are cleaned up via the ssync module and +once that partition's set of jobs is complete, the reconstructor will attempt to +remove the relevant directory structures. + +Job construction must account for a variety of scenarios, including: + +#. A partition directory with all fragment indexes matching the local node + index. This is the case where everything is where it belongs and we just + need to compare hashes and sync if needed. Here we simply sync with our + partners. +#. A partition directory with at least one local fragment index and mix of + others. Here we need to sync with our partners where fragment indexes + matches the local_id, all others are sync'd with their home nodes and then + deleted. +#. A partition directory with no local fragment index and just one or more of + others. Here we sync with just the home nodes for the fragment indexes that + we have and then all the local archives are deleted. This is the basic + handoff reversion case. + +.. note:: + A \"home node\" is the node where the fragment index encoded in the + fragment archive's filename matches the node index of a node in the primary + partition list. + +Node Communication +------------------ + +The replicators talk to all nodes who have a copy of their object, typically +just 2 other nodes. For EC, having each reconstructor node talk to all nodes +would incur a large amount of overhead as there will typically be a much larger +number of nodes participating in the EC scheme. Therefore, the reconstructor is +built to talk to its adjacent nodes on the ring only. These nodes are typically +referred to as partners. + +Reconstruction +-------------- + +Reconstruction can be thought of sort of like replication but with an extra step +in the middle. The reconstructor is hard-wired to use ssync to determine what is +missing and desired by the other side. However, before an object is sent over +the wire it needs to be reconstructed from the remaining fragments as the local +fragment is just that - a different fragment index than what the other end is +asking for. + +Thus, there are hooks in ssync for EC based policies. One case would be for +basic reconstruction which, at a high level, looks like this: + +* Determine which nodes need to be contacted to collect other EC archives needed + to perform reconstruction. +* Update the etag and fragment index metadata elements of the newly constructed + fragment archive. +* Establish a connection to the target nodes and give ssync a DiskFileLike class + from which it can stream data. + +The reader in this class gathers fragments from the nodes and uses PyECLib to +reconstruct each segment before yielding data back to ssync. Essentially what +this means is that data is buffered, in memory, on a per segment basis at the +node performing reconstruction and each segment is dynamically reconstructed and +delivered to ``ssync_sender`` where the ``send_put()`` method will ship them on +over. The sender is then responsible for deleting the objects as they are sent +in the case of data reversion. 
+ +The Auditor +=========== + +Because the auditor already operates on a per storage policy basis, there are no +specific auditor changes associated with EC. Each EC archive looks like, and is +treated like, a regular object from the perspective of the auditor. Therefore, +if the auditor finds bit-rot in an EC archive, it simply quarantines it and the +reconstructor will take care of the rest just as the replicator does for +replication policies. diff --git a/doc/source/overview_expiring_objects.rst b/doc/source/overview_expiring_objects.rst index ba91570963..9fe0fefe5e 100644 --- a/doc/source/overview_expiring_objects.rst +++ b/doc/source/overview_expiring_objects.rst @@ -2,42 +2,187 @@ Expiring Object Support ======================= -The ``swift-object-expirer`` offers scheduled deletion of objects. The Swift client would use the ``X-Delete-At`` or ``X-Delete-After`` headers during an object ``PUT`` or ``POST`` and the cluster would automatically quit serving that object at the specified time and would shortly thereafter remove the object from the system. +The ``swift-object-expirer`` offers scheduled deletion of objects. The Swift +client would use the ``X-Delete-At`` or ``X-Delete-After`` headers during an +object ``PUT`` or ``POST`` and the cluster would automatically quit serving +that object at the specified time and would shortly thereafter remove the +object from the system. -The ``X-Delete-At`` header takes a Unix Epoch timestamp, in integer form; for example: ``1317070737`` represents ``Mon Sep 26 20:58:57 2011 UTC``. +The ``X-Delete-At`` header takes a Unix Epoch timestamp, in integer form; for +example: ``1317070737`` represents ``Mon Sep 26 20:58:57 2011 UTC``. -The ``X-Delete-After`` header takes a integer number of seconds. The proxy server that receives the request will convert this header into an ``X-Delete-At`` header using its current time plus the value given. +The ``X-Delete-After`` header takes a positive integer number of seconds. The +proxy server that receives the request will convert this header into an +``X-Delete-At`` header using the request timestamp plus the value given. -As expiring objects are added to the system, the object servers will record the expirations in a hidden ``.expiring_objects`` account for the ``swift-object-expirer`` to handle later. +If both the ``X-Delete-At`` and ``X-Delete-After`` headers are sent with a +request then the ``X-Delete-After`` header will take precedence. -Just one instance of the ``swift-object-expirer`` daemon needs to run for a cluster. This isn't exactly automatic failover high availability, but if this daemon doesn't run for a few hours it should not be any real issue. The expired-but-not-yet-deleted objects will still ``404 Not Found`` if someone tries to ``GET`` or ``HEAD`` them and they'll just be deleted a bit later when the daemon is restarted. +As expiring objects are added to the system, the object servers will record the +expirations in a hidden ``.expiring_objects`` account for the +``swift-object-expirer`` to handle later. -The daemon uses the ``/etc/swift/object-expirer.conf`` by default, and here is a quick sample conf file:: +Usually, just one instance of the ``swift-object-expirer`` daemon needs to run +for a cluster. This isn't exactly automatic failover high availability, but if +this daemon doesn't run for a few hours it should not be any real issue. 
The +expired-but-not-yet-deleted objects will still ``404 Not Found`` if someone +tries to ``GET`` or ``HEAD`` them and they'll just be deleted a bit later when +the daemon is restarted. + +By default, the ``swift-object-expirer`` daemon will run with a concurrency of +1. Increase this value to get more concurrency. A concurrency of 1 may not be +enough to delete expiring objects in a timely fashion for a particular Swift +cluster. + +It is possible to run multiple daemons to do different parts of the work if a +single process with a concurrency of more than 1 is not enough (see the sample +config file for details). + +To run the ``swift-object-expirer`` as multiple processes, set ``processes`` to +the number of processes (either in the config file or on the command line). +Then run one process for each part. Use ``process`` to specify the part of the +work to be done by a process using the command line or the config. So, for +example, if you'd like to run three processes, set ``processes`` to 3 and run +three processes with ``process`` set to 0, 1, and 2 for the three processes. +If multiple processes are used, it's necessary to run one for each part of the +work or that part of the work will not be done. + +By default the daemon looks for two different config files. When launching, +the process searches for the ``[object-expirer]`` section in the + +``/etc/swift/object-server.conf`` config. If the section or the config is missing +it will then look for and use the ``/etc/swift/object-expirer.conf`` config. +The latter config file is considered deprecated and is searched for to aid +in cluster upgrades. + +Delay Reaping of Objects from Disk +---------------------------------- + +Swift's expiring object ``x-delete-at`` feature can be used to have the cluster +reap user's objects automatically from disk on their behalf when they no longer +want them stored in their account. In some cases it may be necessary to +"intervene" in the expected expiration process to prevent accidental or +premature data loss if an object marked for expiration should NOT be deleted +immediately when it expires for whatever reason. In these cases +``swift-object-expirer`` offers configuration of a ``delay_reaping`` value +on accounts and containers, which provides a delay between when an object +is marked for deletion, or expired, and when it is actually reaped from disk. +When this is set in the object expirer config the object expirer leaves expired +objects on disk (and in container listings) for the ``delay_reaping`` time. +After this delay has passed objects will be reaped as normal. + +The ``delay_reaping`` value can be set either at an account level or a +container level. When set at an account level, the object expirer will +only reap objects within the account after the delay. A container level +``delay_reaping`` works similarly for containers and overrides an account +level ``delay_reaping`` value. + +The ``delay_reaping`` values are set in the ``[object-expirer]`` section in +either the object-server or object-expirer config files. They are configured +with dynamic config option names prefixed with ``delay_reaping_`` +at the account level and ``delay_reaping_/`` at the container +level, with the ``delay_reaping`` value in seconds. 
+ +Here is an example of ``delay_reaping`` configs in the``object-expirer`` +section in the ``object-server.conf``:: - [DEFAULT] - # swift_dir = /etc/swift - # user = swift - # You can specify default log routing here if you want: - # log_name = swift - # log_facility = LOG_LOCAL0 - # log_level = INFO - [object-expirer] - interval = 300 - - [pipeline:main] - pipeline = catch_errors cache proxy-server - - [app:proxy-server] - use = egg:swift#proxy - # See proxy-server.conf-sample for options - - [filter:cache] - use = egg:swift#memcache - # See proxy-server.conf-sample for options - - [filter:catch_errors] - use = egg:swift#catch_errors - # See proxy-server.conf-sample for options - -The daemon needs to run on a machine with access to all the backend servers in the cluster, but does not need proxy server or public access. The daemon will use its own internal proxy code instance to access the backend servers. + delay_reaping_AUTH_test = 300.0 + delay_reaping_AUTH_test2 = 86400.0 + delay_reaping_AUTH_test/test = 0.0 + delay_reaping_AUTH_test/test2 = 600.0 + +.. note:: + A container level ``delay_reaping`` value does not require an account level + ``delay_reaping`` value but overrides the account level value for the same + account if it exists. By default, no ``delay_reaping`` value is configured + for any accounts or containers. + +Accessing Objects After Expiration +---------------------------------- + +By default, objects that expire become inaccessible, even to the account owner. +The object may not have been deleted, but any GET/HEAD/POST client request for +the object will respond 404 Not Found after the ``x-delete-at`` timestamp +has passed. + +The ``swift-proxy-server`` offers the ability to globally configure a flag to +allow requests to access expired objects that have not yet been deleted. +When this flag is enabled, a user can make a GET, HEAD, or POST request with +the header ``x-open-expired`` set to true to access the expired object. + +The global configuration is an opt-in flag that can be set in the +``[proxy-server]`` section of the ``proxy-server.conf`` file. It is configured +with a single flag ``allow_open_expired`` set to true or false. By default, +this flag is set to false. + +Here is an example in the ``proxy-server`` section in ``proxy-server.conf``:: + + [proxy-server] + allow_open_expired = false + +To discover whether this flag is set, you can send a **GET** request to the +``/info`` :ref:`discoverability ` path. This will return +configuration data in JSON format where the value of ``allow_open_expired`` is +exposed. + +When using a temporary URL to access the object, this feature is not enabled. +This means that adding the header will not allow requests to temporary URLs +to access expired objects. + +Upgrading impact: General Task Queue vs Legacy Queue +---------------------------------------------------- + +The expirer daemon will be moving to a new general task-queue based design that +will divide the work across all object servers, as such only expirers defined +in the object-server config will be able to use the new system. + +The legacy object expirer config is documented in +``etc/object-expirer.conf-sample``. The alternative object-server config +section is documented in ``etc/object-server.conf-sample``. 
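For illustration, a minimal ``[object-expirer]`` section added to
``object-server.conf`` might look like the following (the values shown are
placeholders; see the sample config files for the full set of options, and see
below for the ``dequeue_from_legacy`` option)::

    [object-expirer]
    interval = 300
    concurrency = 4
    processes = 3
    process = 0
    dequeue_from_legacy = false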
+ +The parameters in both files are identical except for a new option in the +object-server ``[object-expirer]`` section, ``dequeue_from_legacy`` +which when set to ``True`` will tell the expirer that in addition to using +the new task queueing system to also check the legacy (soon to be deprecated) +queue. + +.. note:: + The new task-queue system has not been completed yet. So an expirer's with + ``dequeue_from_legacy`` set to ``False`` will currently do nothing. + +By default ``dequeue_from_legacy`` will be ``False``, it is necessary to +be set to ``True`` explicitly while migrating from the old expiring queue. + +Any expirer using the old config ``/etc/swift/object-expirer.conf`` will not +use the new general task queue. It'll ignore the ``dequeue_from_legacy`` +and will only check the legacy queue. Meaning it'll run as a legacy expirer. + +Why is this important? If you are currently running object-expirers on nodes +that are not object storage nodes, then for the time being they will still +work but only by dequeuing from the old queue. +When the new general task queue is introduced, expirers will be required to +run on the object servers so that any new objects added can be removed. +If you're in this situation, you can safely setup the new expirer +section in the ``object-server.conf`` to deal with the new queue and leave the +legacy expirers running elsewhere. + +However, if your old expirers are running on the object-servers, the most +common topology, then you would add the new section to all object servers, to +deal the new queue. In order to maintain the same number of expirers checking +the legacy queue, pick the same number of nodes as you previously had and turn +on ``dequeue_from_legacy`` on those nodes only. Also note on these nodes +you'd need to keep the legacy ``process`` and ``processes`` options to maintain +the concurrency level for the legacy queue. + +.. note:: + Be careful not to enable ``dequeue_from_legacy`` on too many expirers as + all legacy tasks are stored in a single hidden account and the same hidden + containers. On a large cluster one may inadvertently overload the + acccount/container servers handling the legacy expirer queue. + +.. note:: + When running legacy expirers, the daemon needs to run on a machine with + access to all the backend servers in the cluster, but does not need proxy + server or public access. The daemon will use its own internal proxy code + instance to access the backend servers. diff --git a/doc/source/overview_global_cluster.rst b/doc/source/overview_global_cluster.rst new file mode 100644 index 0000000000..2f1c40bf88 --- /dev/null +++ b/doc/source/overview_global_cluster.rst @@ -0,0 +1,149 @@ +=============== +Global Clusters +=============== + +-------- +Overview +-------- + +Swift's default configuration is currently designed to work in a +single region, where a region is defined as a group of machines with +high-bandwidth, low-latency links between them. However, configuration +options exist that make running a performant multi-region Swift +cluster possible. + +For the rest of this section, we will assume a two-region Swift +cluster: region 1 in San Francisco (SF), and region 2 in New York +(NY). Each region shall contain within it 3 zones, numbered 1, 2, and +3, for a total of 6 zones. + +.. _configuring_global_clusters: + +--------------------------- +Configuring Global Clusters +--------------------------- + +.. 
note:: + + The proxy-server configuration options described below can be given generic + settings in the ``[app:proxy-server]`` configuration section and/or given + specific settings for individual policies using + :ref:`proxy_server_per_policy_config`. + +~~~~~~~~~~~~~ +read_affinity +~~~~~~~~~~~~~ + +This setting, combined with sorting_method setting, makes the proxy +server prefer local backend servers for GET and HEAD requests over +non-local ones. For example, it is preferable for an SF proxy server +to service object GET requests by talking to SF object servers, as the +client will receive lower latency and higher throughput. + +By default, Swift randomly chooses one of the three replicas to give +to the client, thereby spreading the load evenly. In the case of a +geographically-distributed cluster, the administrator is likely to +prioritize keeping traffic local over even distribution of results. +This is where the read_affinity setting comes in. + +Example:: + + [app:proxy-server] + sorting_method = affinity + read_affinity = r1=100 + +This will make the proxy attempt to service GET and HEAD requests from +backends in region 1 before contacting any backends in region 2. +However, if no region 1 backends are available (due to replica +placement, failed hardware, or other reasons), then the proxy will +fall back to backend servers in other regions. + +Example:: + + [app:proxy-server] + sorting_method = affinity + read_affinity = r1z1=100, r1=200 + +This will make the proxy attempt to service GET and HEAD requests from +backends in region 1 zone 1, then backends in region 1, then any other +backends. If a proxy is physically close to a particular zone or +zones, this can provide bandwidth savings. For example, if a zone +corresponds to servers in a particular rack, and the proxy server is +in that same rack, then setting read_affinity to prefer reads from +within the rack will result in less traffic between the top-of-rack +switches. + +The read_affinity setting may contain any number of region/zone +specifiers; the priority number (after the equals sign) determines the +ordering in which backend servers will be contacted. A lower number +means higher priority. + +Note that read_affinity only affects the ordering of primary nodes +(see ring docs for definition of primary node), not the ordering of +handoff nodes. + +~~~~~~~~~~~~~~ +write_affinity +~~~~~~~~~~~~~~ + +This setting makes the proxy server prefer local backend servers for +object PUT requests over non-local ones. For example, it may be +preferable for an SF proxy server to service object PUT requests +by talking to SF object servers, as the client will receive lower +latency and higher throughput. However, if this setting is used, note +that a NY proxy server handling a GET request for an object that was +PUT using write affinity may have to fetch it across the WAN link, as +the object won't immediately have any replicas in NY. However, +replication will move the object's replicas to their proper homes in +both SF and NY. + +One potential issue with write_affinity is, end user may get 404 error when +deleting objects before replication. The write_affinity_handoff_delete_count +setting is used together with write_affinity in order to solve that issue. +With its default configuration, Swift will calculate the proper number of +handoff nodes to send requests to. 
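For example, to override the calculated default with an explicit handoff
count (the value here is purely illustrative)::

    [app:proxy-server]
    write_affinity = r1
    write_affinity_handoff_delete_count = 2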
+ +Note that only object PUT/DELETE requests are affected by the write_affinity +setting; POST, GET, HEAD, OPTIONS, and account/container PUT requests are +not affected. + +This setting lets you trade data distribution for throughput. If +write_affinity is enabled, then object replicas will initially be +stored all within a particular region or zone, thereby decreasing the +quality of the data distribution, but the replicas will be distributed +over fast WAN links, giving higher throughput to clients. Note that +the replicators will eventually move objects to their proper, +well-distributed homes. + +The write_affinity setting is useful only when you don't typically +read objects immediately after writing them. For example, consider a +workload of mainly backups: if you have a bunch of machines in NY that +periodically write backups to Swift, then odds are that you don't then +immediately read those backups in SF. If your workload doesn't look +like that, then you probably shouldn't use write_affinity. + +The write_affinity_node_count setting is only useful in conjunction +with write_affinity; it governs how many local object servers will be +tried before falling back to non-local ones. + +Example:: + + [app:proxy-server] + write_affinity = r1 + write_affinity_node_count = 2 * replicas + +Assuming 3 replicas, this configuration will make object PUTs try +storing the object's replicas on up to 6 disks ("2 * replicas") in +region 1 ("r1"). Proxy server tries to find 3 devices for storing the +object. While a device is unavailable, it queries the ring for the 4th +device and so on until 6th device. If the 6th disk is still unavailable, +the last replica will be sent to other region. It doesn't mean there'll +have 6 replicas in region 1. + + +You should be aware that, if you have data coming into SF faster than +your replicators are transferring it to NY, then your cluster's data +distribution will get worse and worse over time as objects pile up in SF. +If this happens, it is recommended to disable write_affinity and simply let +object PUTs traverse the WAN link, as that will naturally limit the +object growth rate to what your WAN link can handle. diff --git a/doc/source/overview_large_objects.rst b/doc/source/overview_large_objects.rst index 52176172e9..e96c87015f 100644 --- a/doc/source/overview_large_objects.rst +++ b/doc/source/overview_large_objects.rst @@ -1,3 +1,5 @@ +.. _large-objects: + ==================== Large Object Support ==================== @@ -13,88 +15,39 @@ special manifest file is created that, when downloaded, sends all the segments concatenated as a single object. This also offers much greater upload speed with the possibility of parallel uploads of the segments. -------------------------------------- -Using ``swift`` for Segmented Objects -------------------------------------- - -The quickest way to try out this feature is use the ``swift`` Swift Tool -included with the `python-swiftclient`_ library. You can use the ``-S`` -option to specify the segment size to use when splitting a large file. For -example:: +.. _dynamic-large-objects: - swift upload test_container -S 1073741824 large_file +.. _dlo-doc: -This would split the large_file into 1G segments and begin uploading those -segments in parallel. Once all the segments have been uploaded, ``swift`` will -then create the manifest file so the segments can be downloaded as one. 
+--------------------- +Dynamic Large Objects +--------------------- -So now, the following ``swift`` command would download the entire large object:: +.. automodule:: swift.common.middleware.dlo + :members: + :show-inheritance: - swift download test_container large_file +.. _static-large-objects: -``swift`` uses a strict convention for its segmented object -support. In the above example it will upload all the segments into a -second container named test_container_segments. These segments will -have names like large_file/1290206778.25/21474836480/00000000, -large_file/1290206778.25/21474836480/00000001, etc. +.. _slo-doc: -The main benefit for using a separate container is that the main container -listings will not be polluted with all the segment names. The reason for using -the segment name format of /// is so that an -upload of a new file with the same name won't overwrite the contents of the -first until the last moment when the manifest file is updated. +-------------------- +Static Large Objects +-------------------- -``swift`` will manage these segment files for you, deleting old segments on -deletes and overwrites, etc. You can override this behavior with the -``--leave-segments`` option if desired; this is useful if you want to have -multiple versions of the same large object available. - -.. _`python-swiftclient`: http://github.com/openstack/python-swiftclient +.. automodule:: swift.common.middleware.slo + :members: + :show-inheritance: ---------- Direct API ---------- -You can also work with the segments and manifests directly with HTTP -requests instead of having ``swift`` do that for you. You can just -upload the segments like you would any other object and the manifest -is just a zero-byte file with an extra ``X-Object-Manifest`` header. - -All the object segments need to be in the same container, have a common object -name prefix, and their names sort in the order they should be concatenated. -They don't have to be in the same container as the manifest file will be, which -is useful to keep container listings clean as explained above with ``swift``. - -The manifest file is simply a zero-byte file with the extra -``X-Object-Manifest: /`` header, where ```` is -the container the object segments are in and ```` is the common prefix -for all the segments. - -It is best to upload all the segments first and then create or update the -manifest. In this way, the full object won't be available for downloading until -the upload is complete. Also, you can upload a new set of segments to a second -location and then update the manifest to point to this new location. During the -upload of the new segments, the original manifest will still be available to -download the first set of segments. - -Here's an example using ``curl`` with tiny 1-byte segments:: - - # First, upload the segments - curl -X PUT -H 'X-Auth-Token: ' \ - http:///container/myobject/1 --data-binary '1' - curl -X PUT -H 'X-Auth-Token: ' \ - http:///container/myobject/2 --data-binary '2' - curl -X PUT -H 'X-Auth-Token: ' \ - http:///container/myobject/3 --data-binary '3' - - # Next, create the manifest file - curl -X PUT -H 'X-Auth-Token: ' \ - -H 'X-Object-Manifest: container/myobject/' \ - http:///container/myobject --data-binary '' - - # And now we can download the segments as a single object - curl -H 'X-Auth-Token: ' \ - http:///container/myobject +SLO support centers around the user generated manifest file. After the user +has uploaded the segments into their account a manifest file needs to be +built and uploaded. 
All object segments, must be at least 1 byte +in size. Please see the SLO docs for :ref:`slo-doc` further +details. ---------------- Additional Notes @@ -104,6 +57,10 @@ Additional Notes /`` header will be returned with the concatenated object so you can tell where it's getting its segments from. +* When updating a manifest object using a POST request, a + ``X-Object-Manifest`` header must be included for the object to + continue to behave as a manifest object. + * The response's ``Content-Length`` for a ``GET`` or ``HEAD`` on the manifest file will be the sum of all the segments in the ``/`` listing, dynamically. So, uploading additional segments after the manifest is @@ -117,11 +74,11 @@ Additional Notes * The response's ``ETag`` for a ``GET`` or ``HEAD`` on the manifest file will be the MD5 sum of the concatenated string of ETags for each of the segments - in the ``/`` listing, dynamically. Usually in Swift the - ETag is the MD5 sum of the contents of the object, and that holds true for - each segment independently. But, it's not feasible to generate such an ETag - for the manifest itself, so this method was chosen to at least offer change - detection. + in the manifest (for DLO, from the listing ``/``). + Usually in Swift the ETag is the MD5 sum of the contents of the object, and + that holds true for each segment independently. But it's not meaningful to + generate such an ETag for the manifest itself so this method was chosen to + at least offer change detection. .. note:: @@ -134,10 +91,10 @@ Additional Notes History ------- -Large object support has gone through various iterations before settling on -this implementation. +Dynamic large object support has gone through various iterations before +settling on this implementation. -The primary factor driving the limitation of object size in swift is +The primary factor driving the limitation of object size in Swift is maintaining balance among the partitions of the ring. To maintain an even dispersion of disk usage throughout the cluster the obvious storage pattern was to simply split larger objects into smaller segments, which could then be @@ -168,20 +125,32 @@ The current "user manifest" design was chosen in order to provide a transparent download of large objects to the client and still provide the uploading client a clean API to support segmented uploads. -Alternative "explicit" user manifest options were discussed which would have -required a pre-defined format for listing the segments to "finalize" the -segmented upload. While this may offer some potential advantages, it was -decided that pushing an added burden onto the client which could potentially -limit adoption should be avoided in favor of a simpler "API" (essentially just -the format of the 'X-Object-Manifest' header). - -During development it was noted that this "implicit" user manifest approach -which is based on the path prefix can be potentially affected by the eventual -consistency window of the container listings, which could theoretically cause -a GET on the manifest object to return an invalid whole object for that short -term. In reality you're unlikely to encounter this scenario unless you're -running very high concurrency uploads against a small testing environment -which isn't running the object-updaters or container-replicators. - -Like all of swift, Large Object Support is living feature which will continue -to improve and may change over time. +To meet an many use cases as possible Swift supports two types of large +object manifests. 
Dynamic and static large object manifests both support +the same idea of allowing the user to upload many segments to be later +downloaded as a single file. + +Dynamic large objects rely on a container listing to provide the manifest. +This has the advantage of allowing the user to add/removes segments from the +manifest at any time. It has the disadvantage of relying on eventually +consistent container listings. All three copies of the container dbs must +be updated for a complete list to be guaranteed. Also, all segments must +be in a single container, which can limit concurrent upload speed. + +Static large objects rely on a user provided manifest file. A user can +upload objects into multiple containers and then reference those objects +(segments) in a self generated manifest file. Future GETs to that file will +download the concatenation of the specified segments. This has the advantage of +being able to immediately download the complete object once the manifest has +been successfully PUT. Being able to upload segments into separate containers +also improves concurrent upload speed. It has the disadvantage that the +manifest is finalized once PUT. Any changes to it means it has to be replaced. + +Between these two methods the user has great flexibility in how (s)he chooses +to upload and retrieve large objects to Swift. Swift does not, however, stop +the user from harming themselves. In both cases the segments are deletable by +the user at any time. If a segment was deleted by mistake, a dynamic large +object, having no way of knowing it was ever there, would happily ignore the +deleted file and the user will get an incomplete file. A static large object +would, when failing to retrieve the object specified in the manifest, drop the +connection and the user would receive partial results. diff --git a/doc/source/overview_object_versioning.rst b/doc/source/overview_object_versioning.rst deleted file mode 100644 index c9355a9b51..0000000000 --- a/doc/source/overview_object_versioning.rst +++ /dev/null @@ -1,77 +0,0 @@ -================= -Object Versioning -================= - --------- -Overview --------- - -Object versioning in swift is implemented by setting a flag on the container -to tell swift to version all objects in the container. The flag is the -``X-Versions-Location`` header on the container, and its value is the -container where the versions are stored. It is recommended to use a different -``X-Versions-Location`` container for each container that is being versioned. - -When data is ``PUT`` into a versioned container (a container with the -versioning flag turned on), the existing data in the file is redirected to a -new object and the data in the ``PUT`` request is saved as the data for the -versioned object. The new object name (for the previous version) is -``//``, where ``length`` -is the 3-character zero-padded hexidecimal length of the ```` and -```` is the timestamp of when the previous version was created. - -A ``GET`` to a versioned object will return the current version of the object -without having to do any request redirects or metadata lookups. - -A ``POST`` to a versioned object will update the object metadata as normal, -but will not create a new version of the object. In other words, new versions -are only created when the content of the object changes. - -A ``DELETE`` to a versioned object will only remove the current version of the -object. If you have 5 total versions of the object, you must delete the -object 5 times to completely remove the object. 
- -Note: A large object manifest file cannot be versioned, but a large object -manifest may point to versioned segments. - --------------------------------------------------- -How to Enable Object Versioning in a Swift Cluster --------------------------------------------------- - -Set ``allow_versions`` to ``True`` in the container server config. - ------------------------ -Examples Using ``curl`` ------------------------ - -First, create a container with the ``X-Versions-Location`` header or add the -header to an existing container. Also make sure the container referenced by -the ``X-Versions-Location`` exists. In this example, the name of that -container is "versions":: - - curl -i -XPUT -H "X-Auth-Token: " \ - -H "X-Versions-Location: versions" http:///container - curl -i -XPUT -H "X-Auth-Token: " http:///versions - -Create an object (the first version):: - - curl -i -XPUT --data-binary 1 -H "X-Auth-Token: " \ - http:///container/myobject - -Now create a new version of that object:: - - curl -i -XPUT --data-binary 2 -H "X-Auth-Token: " \ - http:///container/myobject - -See a listing of the older versions of the object:: - - curl -i -H "X-Auth-Token: " \ - http:///versions?prefix=008myobject/ - -Now delete the current version of the object and see that the older version is -gone:: - - curl -i -XDELETE -H "X-Auth-Token: " \ - http:///container/myobject - curl -i -H "X-Auth-Token: " \ - http:///versions?prefix=008myobject/ diff --git a/doc/source/overview_policies.rst b/doc/source/overview_policies.rst new file mode 100644 index 0000000000..822db5037e --- /dev/null +++ b/doc/source/overview_policies.rst @@ -0,0 +1,680 @@ +================ +Storage Policies +================ + +Storage Policies allow for some level of segmenting the cluster for various +purposes through the creation of multiple object rings. The Storage Policies +feature is implemented throughout the entire code base so it is an important +concept in understanding Swift architecture. + +As described in :doc:`overview_ring`, Swift uses modified hashing rings to +determine where data should reside in the cluster. There is a separate ring for +account databases, container databases, and there is also one object ring per +storage policy. Each object ring behaves exactly the same way and is maintained +in the same manner, but with policies, different devices can belong to different +rings. By supporting multiple object rings, Swift allows the application and/or +deployer to essentially segregate the object storage within a single cluster. +There are many reasons why this might be desirable: + +* Different levels of durability: If a provider wants to offer, for example, + 2x replication and 3x replication but doesn't want to maintain 2 separate + clusters, they would setup a 2x and a 3x replication policy and assign the + nodes to their respective rings. Furthermore, if a provider wanted to offer a + cold storage tier, they could create an erasure coded policy. + +* Performance: Just as SSDs can be used as the exclusive members of an account + or database ring, an SSD-only object ring can be created as well and used to + implement a low-latency/high performance policy. + +* Collecting nodes into group: Different object rings may have different + physical servers so that objects in specific storage policies are always + placed in a particular data center or geography. 
+ +* Different Storage implementations: Another example would be to collect + together a set of nodes that use a different Diskfile (e.g., Kinetic, + GlusterFS) and use a policy to direct traffic just to those nodes. + +* Different read and write affinity settings: proxy-servers can be configured + to use different read and write affinity options for each policy. See + :ref:`proxy_server_per_policy_config` for more details. + +.. note:: + + Today, Swift supports two different policy types: Replication and Erasure + Code. See :doc:`overview_erasure_code` for details. + + Also note that Diskfile refers to backend object storage plug-in + architecture. See :doc:`development_ondisk_backends` for details. + +----------------------- +Containers and Policies +----------------------- + +Policies are implemented at the container level. There are many advantages to +this approach, not the least of which is how easy it makes life on +applications that want to take advantage of them. It also ensures that +Storage Policies remain a core feature of Swift independent of the auth +implementation. Policies were not implemented at the account/auth layer +because it would require changes to all auth systems in use by Swift +deployers. Each container has a new special immutable metadata element called +the storage policy index. Note that internally, Swift relies on policy +indexes and not policy names. Policy names exist for human readability and +translation is managed in the proxy. When a container is created, one new +optional header is supported to specify the policy name. If no name is +specified, the default policy is used (and if no other policies defined, +Policy-0 is considered the default). We will be covering the difference +between default and Policy-0 in the next section. + +Policies are assigned when a container is created. Once a container has been +assigned a policy, it cannot be changed (unless it is deleted/recreated). The +implications on data placement/movement for large datasets would make this a +task best left for applications to perform. Therefore, if a container has an +existing policy of, for example 3x replication, and one wanted to migrate that +data to an Erasure Code policy, the application would create another container +specifying the other policy parameters and then simply move the data from one +container to the other. Policies apply on a per container basis allowing for +minimal application awareness; once a container has been created with a specific +policy, all objects stored in it will be done so in accordance with that policy. +If a container with a specific name is deleted (requires the container be empty) +a new container may be created with the same name without any restriction on +storage policy enforced by the deleted container which previously shared the +same name. + +Containers have a many-to-one relationship with policies meaning that any number +of containers can share one policy. There is no limit to how many containers +can use a specific policy. + +The notion of associating a ring with a container introduces an interesting +scenario: What would happen if 2 containers of the same name were created with +different Storage Policies on either side of a network outage at the same time? +Furthermore, what would happen if objects were placed in those containers, a +whole bunch of them, and then later the network outage was restored? Well, +without special care it would be a big problem as an application could end up +using the wrong ring to try and find an object. 
Luckily there is a solution for +this problem, a daemon known as the Container Reconciler works tirelessly to +identify and rectify this potential scenario. + +-------------------- +Container Reconciler +-------------------- + +Because atomicity of container creation cannot be enforced in a +distributed eventually consistent system, object writes into the wrong +storage policy must be eventually merged into the correct storage policy +by an asynchronous daemon. Recovery from object writes during a network +partition which resulted in a split brain container created with +different storage policies are handled by the +`swift-container-reconciler` daemon. + +The container reconciler works off a queue similar to the +object-expirer. The queue is populated during container-replication. +It is never considered incorrect to enqueue an object to be evaluated by +the container-reconciler because if there is nothing wrong with the location +of the object the reconciler will simply dequeue it. The +container-reconciler queue is an indexed log for the real location of an +object for which a discrepancy in the storage policy of the container was +discovered. + +To determine the correct storage policy of a container, it is necessary +to update the status_changed_at field in the container_stat table when a +container changes status from deleted to re-created. This transaction +log allows the container-replicator to update the correct storage policy +both when replicating a container and handling REPLICATE requests. + +Because each object write is a separate distributed transaction it is +not possible to determine the correctness of the storage policy for each +object write with respect to the entire transaction log at a given +container database. As such, container databases will always record the +object write regardless of the storage policy on a per object row basis. +Object byte and count stats are tracked per storage policy in each +container and reconciled using normal object row merge semantics. + +The object rows are ensured to be fully durable during replication using +the normal container replication. After the container +replicator pushes its object rows to available primary nodes any +misplaced object rows are bulk loaded into containers based off the +object timestamp under the ``.misplaced_objects`` system account. The +rows are initially written to a handoff container on the local node, and +at the end of the replication pass the ``.misplaced_objects`` containers are +replicated to the correct primary nodes. + +The container-reconciler processes the ``.misplaced_objects`` containers in +descending order and reaps its containers as the objects represented by +the rows are successfully reconciled. The container-reconciler will +always validate the correct storage policy for enqueued objects using +direct container HEAD requests which are accelerated via caching. + +Because failure of individual storage nodes in aggregate is assumed to +be common at scale, the container-reconciler will make forward progress +with a simple quorum majority. During a combination of failures and +rebalances it is possible that a quorum could provide an incomplete +record of the correct storage policy - so an object write may have to be +applied more than once. Because storage nodes and container databases +will not process writes with an ``X-Timestamp`` less than or equal to +their existing record when objects writes are re-applied their timestamp +is slightly incremented. 
In order for this increment to be applied +transparently to the client a second vector of time has been added to +Swift for internal use. See :class:`~swift.common.utils.Timestamp`. + +As the reconciler applies object writes to the correct storage policy it +cleans up writes which no longer apply to the incorrect storage policy +and removes the rows from the ``.misplaced_objects`` containers. After all +rows have been successfully processed it sleeps and will periodically +check for newly enqueued rows to be discovered during container +replication. + +.. _default-policy: + +------------------------- +Default versus 'Policy-0' +------------------------- + +Storage Policies is a versatile feature intended to support both new and +pre-existing clusters with the same level of flexibility. For that reason, we +introduce the ``Policy-0`` concept which is not the same as the "default" +policy. As you will see when we begin to configure policies, each policy has +a single name and an arbitrary number of aliases (human friendly, +configurable) as well as an index (or simply policy number). Swift reserves +index 0 to map to the object ring that's present in all installations +(e.g., ``/etc/swift/object.ring.gz``). You can name this policy anything you +like, and if no policies are defined it will report itself as ``Policy-0``, +however you cannot change the index as there must always be a policy with +index 0. + +Another important concept is the default policy which can be any policy +in the cluster. The default policy is the policy that is automatically +chosen when a container creation request is sent without a storage +policy being specified. :ref:`configure-policy` describes how to set the +default policy. The difference from ``Policy-0`` is subtle but +extremely important. ``Policy-0`` is what is used by Swift when +accessing pre-storage-policy containers which won't have a policy - in +this case we would not use the default as it might not have the same +policy as legacy containers. When no other policies are defined, Swift +will always choose ``Policy-0`` as the default. + +In other words, default means "create using this policy if nothing else is +specified" and ``Policy-0`` means "use the legacy policy if a container doesn't +have one" which really means use ``object.ring.gz`` for lookups. + +.. note:: + + With the Storage Policy based code, it's not possible to create a + container that doesn't have a policy. If nothing is provided, Swift will + still select the default and assign it to the container. For containers + created before Storage Policies were introduced, the legacy Policy-0 will + be used. + +.. _deprecate-policy: + +-------------------- +Deprecating Policies +-------------------- + +There will be times when a policy is no longer desired; however simply +deleting the policy and associated rings would be problematic for existing +data. In order to ensure that resources are not orphaned in the cluster (left +on disk but no longer accessible) and to provide proper messaging to +applications when a policy needs to be retired, the notion of deprecation is +used. :ref:`configure-policy` describes how to deprecate a policy. 
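+
+As a quick preview of what this looks like (the policy name and index below
+are only examples), a policy is deprecated by adding a single option to its
+existing section in ``/etc/swift/swift.conf``::
+
+    [storage-policy:1]
+    name = silver
+    deprecated = yes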
+
+Swift's behavior with deprecated policies is as follows:
+
+* The deprecated policy will not appear in /info
+* PUT/GET/DELETE/POST/HEAD are still allowed on the pre-existing containers
+  created with a deprecated policy
+* Clients will get a ``400 Bad Request`` error when trying to create a new
+  container using the deprecated policy
+* Clients still have access to policy statistics via HEAD on pre-existing
+  containers
+
+.. note::
+
+    A policy cannot be both the default and deprecated. If you deprecate the
+    default policy, you must specify a new default.
+
+You can also use the deprecated feature to roll out new policies. If you
+want to test a new storage policy before making it generally available
+you could deprecate the policy when you initially roll the new
+configuration and rings out to all nodes. Being deprecated will render it
+unusable for new containers. To test it you will need to create a
+container with that storage policy, which will require a single proxy
+instance (or a set of proxy-servers which are only internally
+accessible) that has been one-off configured with the new policy NOT
+marked deprecated. Once the container has been created with the new
+storage policy any client authorized to use that container will be able
+to add and access data stored in that container in the new storage
+policy. When satisfied you can roll out a new ``swift.conf`` which does
+not mark the policy as deprecated to all nodes.
+
+.. _configure-policy:
+
+--------------------
+Configuring Policies
+--------------------
+
+.. note::
+
+    See :doc:`policies_saio` for a step by step guide on adding a policy to the
+    SAIO setup.
+
+It is important that the deployer have a solid understanding of the semantics
+for configuring policies. Configuring a policy is a three-step process:
+
+#. Edit your ``/etc/swift/swift.conf`` file to define your new policy.
+#. Create the corresponding policy object ring file.
+#. (Optional) Create policy-specific proxy-server configuration settings.
+
+Defining a policy
+-----------------
+
+Each policy is defined by a section in the ``/etc/swift/swift.conf`` file. The
+section name must be of the form ``[storage-policy:<N>]`` where ``<N>`` is the
+policy index. There's no reason other than readability that policy indexes be
+sequential but the following rules are enforced:
+
+* If a policy with index ``0`` is not declared and no other policies are
+  defined, Swift will create a default policy with index ``0``.
+* The policy index must be a non-negative integer.
+* Policy indexes must be unique.
+
+.. warning::
+
+    The index of a policy should never be changed once a policy has been
+    created and used. Changing a policy index may cause loss of access to data.
+
+Each policy section contains the following options:
+
+* ``name = <policy_name>`` (required)
+  - The primary name of the policy.
+  - Policy names are case insensitive.
+  - Policy names must contain only letters, digits or a dash.
+  - Policy names must be unique.
+  - Policy names can be changed.
+  - The name ``Policy-0`` can only be used for the policy with
+    index ``0``.
+  - To avoid confusion with policy indexes it is strongly recommended that
+    policy names are not numbers (e.g. '1'). However, for backwards
+    compatibility, names that are numbers are supported.
+* ``aliases = [<alias-a>[, <alias-b>, ...]]`` (optional)
+  - A comma-separated list of alternative names for the policy.
+  - The default value is an empty list (i.e. no aliases).
+  - All alias names must follow the rules for the ``name`` option.
+ - Aliases can be added to and removed from the list. + - Aliases can be useful to retain support for old primary names if the + primary name is changed. +* ``default = [true|false]`` (optional) + - If ``true`` then this policy will be used when the client does not + specify a policy. + - The default value is ``false``. + - The default policy can be changed at any time, by setting + ``default = true`` in the desired policy section. + - If no policy is declared as the default and no other policies are + defined, the policy with index ``0`` is set as the default; + - Otherwise, exactly one policy must be declared default. + - Deprecated policies cannot be declared the default. + - See :ref:`default-policy` for more information. +* ``deprecated = [true|false]`` (optional) + - If ``true`` then new containers cannot be created using this policy. + - The default value is ``false``. + - Any policy may be deprecated by adding the ``deprecated`` option to + the desired policy section. However, a deprecated policy may not also + be declared the default. Therefore, since there must always be a + default policy, there must also always be at least one policy which + is not deprecated. + - See :ref:`deprecate-policy` for more information. +* ``policy_type = [replication|erasure_coding]`` (optional) + - The option ``policy_type`` is used to distinguish between different + policy types. + - The default value is ``replication``. + - When defining an EC policy use the value ``erasure_coding``. +* ``diskfile_module = `` (optional) + - The option ``diskfile_module`` is used to load an alternate backend + object storage plug-in architecture. + - The default value is ``egg:swift#replication.fs`` or + ``egg:swift#erasure_coding.fs`` depending on the policy type. The scheme + and package name are optionals and default to ``egg`` and ``swift``. + +The EC policy type has additional required options. See +:ref:`using_ec_policy` for details. + +The following is an example of a properly configured ``swift.conf`` file. See +:doc:`policies_saio` for full instructions on setting up an all-in-one with +this example configuration.:: + + [swift-hash] + # random unique strings that can never change (DO NOT LOSE) + # Use only printable chars (python -c "import string; print(string.printable)") + swift_hash_path_prefix = changeme + swift_hash_path_suffix = changeme + + [storage-policy:0] + name = gold + aliases = yellow, orange + policy_type = replication + default = yes + + [storage-policy:1] + name = silver + policy_type = replication + diskfile_module = replication.fs + deprecated = yes + + +Creating a ring +--------------- + +Once ``swift.conf`` is configured for a new policy, a new ring must be created. +The ring tools are not policy name aware so it's critical that the correct +policy index be used when creating the new policy's ring file. Additional +object rings are created using ``swift-ring-builder`` in the same manner as the +legacy ring except that ``-N`` is appended after the word ``object`` in the +builder file name, where ``N`` matches the policy index used in ``swift.conf``. +So, to create the ring for policy index ``1``:: + + swift-ring-builder object-1.builder create 10 3 1 + +Continue to use the same naming convention when using ``swift-ring-builder`` to +add devices, rebalance etc. This naming convention is also used in the pattern +for per-policy storage node data directories. + +.. 
note:: + + The same drives can indeed be used for multiple policies and the details + of how that's managed on disk will be covered in a later section, it's + important to understand the implications of such a configuration before + setting one up. Make sure it's really what you want to do, in many cases + it will be, but in others maybe not. + + +Proxy server configuration (optional) +------------------------------------- + +The :ref:`proxy-server` configuration options related to read and write +affinity may optionally be overridden for individual storage policies. See +:ref:`proxy_server_per_policy_config` for more details. + + +-------------- +Using Policies +-------------- + +Using policies is very simple - a policy is only specified when a container is +initially created. There are no other API changes. Creating a container can +be done without any special policy information:: + + curl -v -X PUT -H 'X-Auth-Token: ' \ + http://127.0.0.1:8080/v1/AUTH_test/myCont0 + +Which will result in a container created that is associated with the +policy name 'gold' assuming we're using the swift.conf example from +above. It would use 'gold' because it was specified as the default. +Now, when we put an object into this container, it will get placed on +nodes that are part of the ring we created for policy 'gold'. + +If we wanted to explicitly state that we wanted policy 'gold' the command +would simply need to include a new header as shown below:: + + curl -v -X PUT -H 'X-Auth-Token: ' \ + -H 'X-Storage-Policy: gold' http://127.0.0.1:8080/v1/AUTH_test/myCont0 + +And that's it! The application does not need to specify the policy name ever +again. There are some illegal operations however: + +* If an invalid (typo, non-existent) policy is specified: 400 Bad Request +* if you try to change the policy either via PUT or POST: 409 Conflict + +If you'd like to see how the storage in the cluster is being used, simply HEAD +the account and you'll see not only the cumulative numbers, as before, but +per policy statistics as well. In the example below there's 3 objects total +with two of them in policy 'gold' and one in policy 'silver':: + + curl -i -X HEAD -H 'X-Auth-Token: ' \ + http://127.0.0.1:8080/v1/AUTH_test + +and your results will include (some output removed for readability):: + + X-Account-Container-Count: 3 + X-Account-Object-Count: 3 + X-Account-Bytes-Used: 21 + X-Storage-Policy-Gold-Object-Count: 2 + X-Storage-Policy-Gold-Bytes-Used: 14 + X-Storage-Policy-Silver-Object-Count: 1 + X-Storage-Policy-Silver-Bytes-Used: 7 + +-------------- +Under the Hood +-------------- + +Now that we've explained a little about what Policies are and how to +configure/use them, let's explore how Storage Policies fit in at the +nuts-n-bolts level. + +Parsing and Configuring +----------------------- + +The module, :ref:`storage_policy`, is responsible for parsing the +``swift.conf`` file, validating the input, and creating a global collection of +configured policies via class :class:`.StoragePolicyCollection`. This +collection is made up of policies of class :class:`.StoragePolicy`. The +collection class includes handy functions for getting to a policy either by +name or by index , getting info about the policies, etc. There's also one +very important function, :meth:`~.StoragePolicyCollection.get_object_ring`. +Object rings are members of the :class:`.StoragePolicy` class and are +actually not instantiated until the :meth:`~.StoragePolicy.load_ring` +method is called. 
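+
+A rough sketch of how a caller typically reaches a ring through this
+collection (the policy index and ``swift_dir`` value below are only
+illustrative)::
+
+    from swift.common.storage_policy import POLICIES
+
+    # Ring for policy index 1; load_ring() runs lazily the first time
+    # this policy's ring is requested.
+    object_ring = POLICIES.get_object_ring(1, '/etc/swift')
+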
Any caller anywhere in the code base that needs to access +an object ring must use the :data:`.POLICIES` global singleton to access the +:meth:`~.StoragePolicyCollection.get_object_ring` function and provide the +policy index which will call :meth:`~.StoragePolicy.load_ring` if +needed; however, when starting request handling services such as the +:ref:`proxy-server` rings are proactively loaded to provide moderate +protection against a mis-configuration resulting in a run time error. The +global is instantiated when Swift starts and provides a mechanism to patch +policies for the test code. + +Middleware +---------- + +Middleware can take advantage of policies through the :data:`.POLICIES` global +and by importing :func:`.get_container_info` to gain access to the policy index +associated with the container in question. From the index it can then use the +:data:`.POLICIES` singleton to grab the right ring. For example, +:ref:`list_endpoints` is policy aware using the means just described. Another +example is :ref:`recon` which will report the md5 sums for all of the rings. + +Proxy Server +------------ + +The :ref:`proxy-server` module's role in Storage Policies is essentially to make +sure the correct ring is used as its member element. Before policies, the one +object ring would be instantiated when the :class:`.Application` class was +instantiated and could be overridden by test code via init parameter. With +policies, however, there is no init parameter and the :class:`.Application` +class instead depends on the :data:`.POLICIES` global singleton to retrieve the +ring which is instantiated the first time it's needed. So, instead of an object +ring member of the :class:`.Application` class, there is an accessor function, +:meth:`~.Application.get_object_ring`, that gets the ring from +:data:`.POLICIES`. + +In general, when any module running on the proxy requires an object ring, it +does so via first getting the policy index from the cached container info. The +exception is during container creation where it uses the policy name from the +request header to look up policy index from the :data:`.POLICIES` global. Once +the proxy has determined the policy index, it can use the +:meth:`~.Application.get_object_ring` method described earlier to gain access to +the correct ring. It then has the responsibility of passing the index +information, not the policy name, on to the back-end servers via the header ``X +-Backend-Storage-Policy-Index``. Going the other way, the proxy also strips the +index out of headers that go back to clients, and makes sure they only see the +friendly policy names. + +On Disk Storage +--------------- + +Policies each have their own directories on the back-end servers and are +identified by their storage policy indexes. Organizing the back-end directory +structures by policy index helps keep track of things and also allows for +sharing of disks between policies which may or may not make sense depending on +the needs of the provider. 
More on this later, but for now be aware of the +following directory naming convention: + +* ``/objects`` maps to objects associated with Policy-0 +* ``/objects-N`` maps to storage policy index #N +* ``/async_pending`` maps to async pending update for Policy-0 +* ``/async_pending-N`` maps to async pending update for storage policy index #N +* ``/tmp`` maps to the DiskFile temporary directory for Policy-0 +* ``/tmp-N`` maps to the DiskFile temporary directory for policy index #N +* ``/quarantined/objects`` maps to the quarantine directory for Policy-0 +* ``/quarantined/objects-N`` maps to the quarantine directory for policy index #N + +Note that these directory names are actually owned by the specific Diskfile +implementation, the names shown above are used by the default Diskfile. + +Object Server +------------- + +The :ref:`object-server` is not involved with selecting the storage policy +placement directly. However, because of how back-end directory structures are +setup for policies, as described earlier, the object server modules do play a +role. When the object server gets a :class:`.Diskfile`, it passes in the +policy index and leaves the actual directory naming/structure mechanisms to +:class:`.Diskfile`. By passing in the index, the instance of +:class:`.Diskfile` being used will assure that data is properly located in the +tree based on its policy. + +For the same reason, the :ref:`object-updater` also is policy aware. As +previously described, different policies use different async pending directories +so the updater needs to know how to scan them appropriately. + +The :ref:`object-replicator` is policy aware in that, depending on the policy, +it may have to do drastically different things, or maybe not. For example, the +difference in handling a replication job for 2x versus 3x is trivial; however, +the difference in handling replication between 3x and erasure code is most +definitely not. In fact, the term 'replication' really isn't appropriate for +some policies like erasure code; however, the majority of the framework for +collecting and processing jobs is common. Thus, those functions in the +replicator are leveraged for all policies and then there is policy specific code +required for each policy, added when the policy is defined if needed. + +The ssync functionality is policy aware for the same reason. Some of the +other modules may not obviously be affected, but the back-end directory +structure owned by :class:`.Diskfile` requires the policy index +parameter. Therefore ssync being policy aware really means passing the +policy index along. See :class:`~swift.obj.ssync_sender` and +:class:`~swift.obj.ssync_receiver` for more information on ssync. + +For :class:`.Diskfile` itself, being policy aware is all about managing the +back-end structure using the provided policy index. In other words, callers who +get a :class:`.Diskfile` instance provide a policy index and +:class:`.Diskfile`'s job is to keep data separated via this index (however it +chooses) such that policies can share the same media/nodes if desired. The +included implementation of :class:`.Diskfile` lays out the directory structure +described earlier but that's owned within :class:`.Diskfile`; external modules +have no visibility into that detail. A common function is provided to map +various directory names and/or strings based on their policy index. 
For example +:class:`.Diskfile` defines :func:`~swift.obj.diskfile.get_data_dir` which builds +off of a generic :func:`.get_policy_string` to consistently build policy aware +strings for various usage. + +Container Server +---------------- + +The :ref:`container-server` plays a very important role in Storage Policies, it +is responsible for handling the assignment of a policy to a container and the +prevention of bad things like changing policies or picking the wrong policy to +use when nothing is specified (recall earlier discussion on Policy-0 versus +default). + +The :ref:`container-updater` is policy aware, however its job is very simple, to +pass the policy index along to the :ref:`account-server` via a request header. + +The :ref:`container-backend` is responsible for both altering existing DB +schema as well as assuring new DBs are created with a schema that supports +storage policies. The "on-demand" migration of container schemas allows Swift +to upgrade without downtime (sqlite's alter statements are fast regardless of +row count). To support rolling upgrades (and downgrades) the incompatible +schema changes to the ``container_stat`` table are made to a +``container_info`` table, and the ``container_stat`` table is replaced with a +view that includes an ``INSTEAD OF UPDATE`` trigger which makes it behave like +the old table. + +The policy index is stored here for use in reporting information +about the container as well as managing split-brain scenario induced +discrepancies between containers and their storage policies. Furthermore, +during split-brain, containers must be prepared to track object updates from +multiple policies so the object table also includes a +``storage_policy_index`` column. Per-policy object counts and bytes are +updated in the ``policy_stat`` table using ``INSERT`` and ``DELETE`` triggers +similar to the pre-policy triggers that updated ``container_stat`` directly. + +The :ref:`container-replicator` daemon will pro-actively migrate legacy +schemas as part of its normal consistency checking process when it updates the +``reconciler_sync_point`` entry in the ``container_info`` table. This ensures +that read heavy containers which do not encounter any writes will still get +migrated to be fully compatible with the post-storage-policy queries without +having to fall back and retry queries with the legacy schema to service +container read requests. + +The :ref:`container-sync-daemon` functionality only needs to be policy aware in +that it accesses the object rings. Therefore, it needs to pull the policy index +out of the container information and use it to select the appropriate object +ring from the :data:`.POLICIES` global. + +Account Server +-------------- + +The :ref:`account-server`'s role in Storage Policies is really limited to +reporting. When a HEAD request is made on an account (see example provided +earlier), the account server is provided with the storage policy index and +builds the ``object_count`` and ``byte_count`` information for the client on a +per policy basis. + +The account servers are able to report per-storage-policy object and byte +counts because of some policy specific DB schema changes. A policy specific +table, ``policy_stat``, maintains information on a per policy basis (one row +per policy) in the same manner in which the ``account_stat`` table does. The +``account_stat`` table still serves the same purpose and is not replaced by +``policy_stat``, it holds the total account stats whereas ``policy_stat`` just +has the break downs. 
The backend is also responsible for migrating +pre-storage-policy accounts by altering the DB schema and populating the +``policy_stat`` table for Policy-0 with current ``account_stat`` data at that +point in time. + +The per-storage-policy object and byte counts are not updated with each object +PUT and DELETE request, instead container updates to the account server are +performed asynchronously by the ``swift-container-updater``. + +.. _upgrade-policy: + +Upgrading and Confirming Functionality +-------------------------------------- + +Upgrading to a version of Swift that has Storage Policy support is not +difficult, in fact, the cluster administrator isn't required to make any special +configuration changes to get going. Swift will automatically begin using the +existing object ring as both the default ring and the Policy-0 ring. Adding the +declaration of policy 0 is totally optional and in its absence, the name given +to the implicit policy 0 will be 'Policy-0'. Let's say for testing purposes +that you wanted to take an existing cluster that already has lots of data on it +and upgrade to Swift with Storage Policies. From there you want to go ahead and +create a policy and test a few things out. All you need to do is: + +#. Upgrade all of your Swift nodes to a policy-aware version of Swift +#. Define your policies in ``/etc/swift/swift.conf`` +#. Create the corresponding object rings +#. Create containers and objects and confirm their placement is as expected + +For a specific example that takes you through these steps, please see +:doc:`policies_saio` + +.. note:: + + If you downgrade from a Storage Policy enabled version of Swift to an + older version that doesn't support policies, you will not be able to + access any data stored in policies other than the policy with index 0 but + those objects WILL appear in container listings (possibly as duplicates if + there was a network partition and un-reconciled objects). It is EXTREMELY + important that you perform any necessary integration testing on the + upgraded deployment before enabling an additional storage policy to ensure + a consistent API experience for your clients. DO NOT downgrade to a + version of Swift that does not support storage policies once you expose + multiple storage policies. diff --git a/doc/source/overview_reaper.rst b/doc/source/overview_reaper.rst index 0488a92863..7e791c31f0 100644 --- a/doc/source/overview_reaper.rst +++ b/doc/source/overview_reaper.rst @@ -18,7 +18,7 @@ account-server.conf to delay the actual deletion of data. At this time, there is no utility to undelete an account; one would have to update the account database replicas directly, setting the status column to an empty string and updating the put_timestamp to be greater than the delete_timestamp. (On the -TODO list is writing a utility to perform this task, preferably through a ReST +TODO list is writing a utility to perform this task, preferably through a REST call.) The account reaper runs on each account server and scans the server @@ -40,6 +40,12 @@ troublesome spot. The account reaper will keep trying to delete an account until it eventually becomes empty, at which point the database reclaim process within the db_replicator will eventually remove the database files. +Sometimes a persistent error state can prevent some object or container +from being deleted. If this happens, you will see a message such as "Account + has not been reaped since " in the log. 
You can control when +this is logged with the reap_warn_after value in the [account-reaper] section +of the account-server.conf file. By default this is 30 days. + ------- History ------- @@ -47,7 +53,7 @@ History At first, a simple approach of deleting an account through completely external calls was considered as it required no changes to the system. All data would simply be deleted in the same way the actual user would, through the public -ReST API. However, the downside was that it would use proxy resources and log +REST API. However, the downside was that it would use proxy resources and log everything when it didn't really need to. Also, it would likely need a dedicated server or two, just for issuing the delete requests. diff --git a/doc/source/overview_replication.rst b/doc/source/overview_replication.rst index ab2b2c1523..ad9d78fc01 100644 --- a/doc/source/overview_replication.rst +++ b/doc/source/overview_replication.rst @@ -2,39 +2,168 @@ Replication =========== -Since each replica in swift functions independently, and clients generally require only a simple majority of nodes responding to consider an operation successful, transient failures like network partitions can quickly cause replicas to diverge. These differences are eventually reconciled by asynchronous, peer-to-peer replicator processes. The replicator processes traverse their local filesystems, concurrently performing operations in a manner that balances load across physical disks. - -Replication uses a push model, with records and files generally only being copied from local to remote replicas. This is important because data on the node may not belong there (as in the case of handoffs and ring changes), and a replicator can't know what data exists elsewhere in the cluster that it should pull in. It's the duty of any node that contains data to ensure that data gets to where it belongs. Replica placement is handled by the ring. - -Every deleted record or file in the system is marked by a tombstone, so that deletions can be replicated alongside creations. These tombstones are cleaned up by the replication process after a period of time referred to as the consistency window, which is related to replication duration and how long transient failures can remove a node from the cluster. Tombstone cleanup must be tied to replication to reach replica convergence. - -If a replicator detects that a remote drive is has failed, it will use the ring's "get_more_nodes" interface to choose an alternate node to synchronize with. The replicator can maintain desired levels of replication in the face of disk failures, though some replicas may not be in an immediately usable location. Note that the replicator doesn't maintain desired levels of replication in the case of other failures (e.g. entire node failures) because the most of such failures are transient. - -Replication is an area of active development, and likely rife with potential improvements to speed and correctness. - -There are two major classes of replicator - the db replicator, which replicates accounts and containers, and the object replicator, which replicates object data. - +Because each replica in Swift functions independently, and clients generally +require only a simple majority of nodes responding to consider an operation +successful, transient failures like network partitions can quickly cause +replicas to diverge. These differences are eventually reconciled by +asynchronous, peer-to-peer replicator processes. 
The replicator processes +traverse their local filesystems, concurrently performing operations in a +manner that balances load across physical disks. + +Replication uses a push model, with records and files generally only being +copied from local to remote replicas. This is important because data on the +node may not belong there (as in the case of handoffs and ring changes), and a +replicator can't know what data exists elsewhere in the cluster that it should +pull in. It's the duty of any node that contains data to ensure that data gets +to where it belongs. Replica placement is handled by the ring. + +Every deleted record or file in the system is marked by a tombstone, so that +deletions can be replicated alongside creations. The replication process cleans +up tombstones after a time period known as the consistency window. +The consistency window encompasses replication duration and how long transient +failure can remove a node from the cluster. Tombstone cleanup must +be tied to replication to reach replica convergence. + +If a replicator detects that a remote drive has failed, the replicator uses +the get_more_nodes interface for the ring to choose an alternate node with +which to synchronize. The replicator can maintain desired levels of replication +in the face of disk failures, though some replicas may not be in an immediately +usable location. Note that the replicator doesn't maintain desired levels of +replication when other failures, such as entire node failures, occur because +most failure are transient. + +Replication is an area of active development, and likely rife with potential +improvements to speed and correctness. + +There are two major classes of replicator - the db replicator, which +replicates accounts and containers, and the object replicator, which +replicates object data. -------------- DB Replication -------------- -The first step performed by db replication is a low-cost hash comparison to find out whether or not two replicas already match. Under normal operation, this check is able to verify that most databases in the system are already synchronized very quickly. If the hashes differ, the replicator brings the databases in sync by sharing records added since the last sync point. +The first step performed by db replication is a low-cost hash comparison to +determine whether two replicas already match. Under normal operation, +this check is able to verify that most databases in the system are already +synchronized very quickly. If the hashes differ, the replicator brings the +databases in sync by sharing records added since the last sync point. -This sync point is a high water mark noting the last record at which two databases were known to be in sync, and is stored in each database as a tuple of the remote database id and record id. Database ids are unique amongst all replicas of the database, and record ids are monotonically increasing integers. After all new records have been pushed to the remote database, the entire sync table of the local database is pushed, so the remote database knows it's now in sync with everyone the local database has previously synchronized with. +This sync point is a high water mark noting the last record at which two +databases were known to be in sync, and is stored in each database as a tuple +of the remote database id and record id. Database ids are unique amongst all +replicas of the database, and record ids are monotonically increasing +integers. 
After all new records have been pushed to the remote database, the +entire sync table of the local database is pushed, so the remote database +can guarantee that it is in sync with everything with which the local database +has previously synchronized. -If a replica is found to be missing entirely, the whole local database file is transmitted to the peer using rsync(1) and vested with a new unique id. +If a replica is found to be missing entirely, the whole local database file is +transmitted to the peer using rsync(1) and vested with a new unique id. -In practice, DB replication can process hundreds of databases per concurrency setting per second (up to the number of available CPUs or disks) and is bound by the number of DB transactions that must be performed. +In practice, DB replication can process hundreds of databases per concurrency +setting per second (up to the number of available CPUs or disks) and is bound +by the number of DB transactions that must be performed. ------------------ Object Replication ------------------ -The initial implementation of object replication simply performed an rsync to push data from a local partition to all remote servers it was expected to exist on. While this performed adequately at small scale, replication times skyrocketed once directory structures could no longer be held in RAM. We now use a modification of this scheme in which a hash of the contents for each suffix directory is saved to a per-partition hashes file. The hash for a suffix directory is invalidated when the contents of that suffix directory are modified. - -The object replication process reads in these hash files, calculating any invalidated hashes. It then transmits the hashes to each remote server that should hold the partition, and only suffix directories with differing hashes on the remote server are rsynced. After pushing files to the remote server, the replication process notifies it to recalculate hashes for the rsynced suffix directories. - -Performance of object replication is generally bound by the number of uncached directories it has to traverse, usually as a result of invalidated suffix directory hashes. Using write volume and partition counts from our running systems, it was designed so that around 2% of the hash space on a normal node will be invalidated per day, which has experimentally given us acceptable replication speeds. - +The initial implementation of object replication simply performed an rsync to +push data from a local partition to all remote servers it was expected to +exist on. While this performed adequately at small scale, replication times +skyrocketed once directory structures could no longer be held in RAM. We now +use a modification of this scheme in which a hash of the contents for each +suffix directory is saved to a per-partition hashes file. The hash for a +suffix directory is invalidated when the contents of that suffix directory are +modified. + +The object replication process reads in these hash files, calculating any +invalidated hashes. It then transmits the hashes to each remote server that +should hold the partition, and only suffix directories with differing hashes +on the remote server are rsynced. After pushing files to the remote server, +the replication process notifies it to recalculate hashes for the rsynced +suffix directories. + +Performance of object replication is generally bound by the number of uncached +directories it has to traverse, usually as a result of invalidated suffix +directory hashes. 
Using write volume and partition counts from our running +systems, it was designed so that around 2% of the hash space on a normal node +will be invalidated per day, which has experimentally given us acceptable +replication speeds. + +.. _ssync: + +Work continues with a new ssync method where rsync is not used at all and +instead all-Swift code is used to transfer the objects. At first, this ssync +will just strive to emulate the rsync behavior. Once deemed stable it will open +the way for future improvements in replication since we'll be able to easily +add code in the replication path instead of trying to alter the rsync code +base and distributing such modifications. + +One of the first improvements planned is an "index.db" that will replace the +hashes.pkl. This will allow quicker updates to that data as well as more +streamlined queries. Quite likely we'll implement a better scheme than the +current one hashes.pkl uses (hash-trees, that sort of thing). + +Another improvement planned all along the way is separating the local disk +structure from the protocol path structure. This separation will allow ring +resizing at some point, or at least ring-doubling. + +Note that for objects being stored with an Erasure Code policy, the replicator +daemon is not involved. Instead, the reconstructor is used by Erasure Code +policies and is analogous to the replicator for Replication type policies. +See :doc:`overview_erasure_code` for complete information on both Erasure Code +support as well as the reconstructor. + +---------- +Hashes.pkl +---------- + +The hashes.pkl file is a key element for both replication and reconstruction +(for Erasure Coding). Both daemons use this file to determine if any kind of +action is required between nodes that are participating in the durability +scheme. The file itself is a pickled dictionary with slightly different +formats depending on whether the policy is Replication or Erasure Code. In +either case, however, the same basic information is provided between the +nodes. The dictionary contains a dictionary where the key is a suffix +directory name and the value is the MD5 hash of the directory listing for +that suffix. In this manner, the daemon can quickly identify differences +between local and remote suffix directories on a per partition basis as the +scope of any one hashes.pkl file is a partition directory. + +For Erasure Code policies, there is a little more information required. An +object's hash directory may contain multiple fragments of a single object in +the event that the node is acting as a handoff or perhaps if a rebalance is +underway. Each fragment of an object is stored with a fragment index, so +the hashes.pkl for an Erasure Code partition will still be a dictionary +keyed on the suffix directory name, however, the value is another dictionary +keyed on the fragment index with subsequent MD5 hashes for each one as +values. Some files within an object hash directory don't require a fragment +index so None is used to represent those. Below are examples of what these +dictionaries might look like. 
+ +Replication hashes.pkl:: + + {'a43': '72018c5fbfae934e1f56069ad4425627', + 'b23': '12348c5fbfae934e1f56069ad4421234'} + +Erasure Code hashes.pkl:: + + {'a43': {None: '72018c5fbfae934e1f56069ad4425627', + 2: 'b6dd6db937cb8748f50a5b6e4bc3b808'}, + 'b23': {None: '12348c5fbfae934e1f56069ad4421234', + 1: '45676db937cb8748f50a5b6e4bc34567'}} + + + + + +----------------------------- +Dedicated replication network +----------------------------- + +Swift has support for using dedicated network for replication traffic. +For more information see :ref:`Overview of dedicated replication network +`. diff --git a/doc/source/overview_ring.rst b/doc/source/overview_ring.rst index 9af54959db..d5415c2c7c 100644 --- a/doc/source/overview_ring.rst +++ b/doc/source/overview_ring.rst @@ -4,48 +4,67 @@ The Rings The rings determine where data should reside in the cluster. There is a separate ring for account databases, container databases, and individual -objects but each ring works in the same way. These rings are externally -managed, in that the server processes themselves do not modify the rings, they -are instead given new rings modified by other tools. - -The ring uses a configurable number of bits from a path's MD5 hash as a -partition index that designates a device. The number of bits kept from the hash -is known as the partition power, and 2 to the partition power indicates the -partition count. Partitioning the full MD5 hash ring allows other parts of the -cluster to work in batches of items at once which ends up either more efficient -or at least less complex than working with each item separately or the entire -cluster all at once. - -Another configurable value is the replica count, which indicates how many of -the partition->device assignments comprise a single ring. For a given partition -number, each replica's device will not be in the same zone as any other -replica's device. Zones can be used to group devices based on physical -locations, power separations, network separations, or any other attribute that -would lessen multiple replicas being unavailable at the same time. +object storage policies but each ring works in the same way. These rings are +externally managed. The server processes themselves do not modify the +rings; they are instead given new rings modified by other tools. + +The ring uses a configurable number of bits from the MD5 hash of an item's path +as a partition index that designates the device(s) on which that item should +be stored. The number of bits kept from the hash is known as the partition +power, and 2 to the partition power indicates the partition count. Partitioning +the full MD5 hash ring allows the cluster components to process resources in +batches. This ends up either more efficient or at least less complex than +working with each item separately or the entire cluster all at once. + +Another configurable value is the replica count, which indicates how many +devices to assign for each partition in the ring. By having multiple devices +responsible for each partition, the cluster can recover from drive or network +failures. + +Devices are added to the ring to describe the capacity available for +partition replica assignments. Devices are placed into failure domains +consisting of region, zone, and server. Regions can be used to describe +geographical systems characterized by lower bandwidth or higher latency between +machines in different regions. Many rings will consist of only a single +region. 
Zones can be used to group devices based on physical locations, power +separations, network separations, or any other attribute that would lessen +multiple replicas being unavailable at the same time. + +Devices are given a weight which describes the relative storage capacity +contributed by the device in comparison to other devices. + +When building a ring, replicas for each partition will be assigned to devices +according to the devices' weights. Additionally, each replica of a partition +will preferentially be assigned to a device whose failure domain does not +already have a replica for that partition. Only a single replica of a +partition may be assigned to each device - you must have at least as many +devices as replicas. + +.. _ring_builder: ------------ Ring Builder ------------ The rings are built and managed manually by a utility called the ring-builder. -The ring-builder assigns partitions to devices and writes an optimized Python -structure to a gzipped, serialized file on disk for shipping out to the servers. -The server processes just check the modification time of the file occasionally -and reload their in-memory copies of the ring structure as needed. Because of -how the ring-builder manages changes to the ring, using a slightly older ring -usually just means one of the three replicas for a subset of the partitions -will be incorrect, which can be easily worked around. - -The ring-builder also keeps its own builder file with the ring information and -additional data required to build future rings. It is very important to keep -multiple backup copies of these builder files. One option is to copy the -builder files out to every server while copying the ring files themselves. -Another is to upload the builder files into the cluster itself. Complete loss -of a builder file will mean creating a new ring from scratch, nearly all -partitions will end up assigned to different devices, and therefore nearly all -data stored will have to be replicated to new locations. So, recovery from a -builder file loss is possible, but data will definitely be unreachable for an -extended time. +The ring-builder assigns partitions to devices and writes an optimized +structure to a gzipped, serialized file on disk for shipping out to the +servers. The server processes check the modification time of the file +occasionally and reload their in-memory copies of the ring structure as needed. +Because of how the ring-builder manages changes to the ring, using a slightly +older ring usually just means that for a subset of the partitions the device +for one of the replicas will be incorrect, which can be easily worked around. + +The ring-builder also keeps a separate builder file which includes the ring +information as well as additional data required to build future rings. It is +very important to keep multiple backup copies of these builder files. One +option is to copy the builder files out to every server while copying the ring +files themselves. Another is to upload the builder files into the cluster +itself. Complete loss of a builder file will mean creating a new ring from +scratch, nearly all partitions will end up assigned to different devices, and +therefore nearly all data stored will have to be replicated to new locations. +So, recovery from a builder file loss is possible, but data will definitely be +unreachable for an extended time. ------------------- Ring Data Structure @@ -60,128 +79,316 @@ to calculate the partition for the hash. 
List of Devices *************** -The list of devices is known internally to the Ring class as devs. Each item in -the list of devices is a dictionary with the following keys: - -====== ======= ============================================================== -id integer The index into the list devices. -zone integer The zone the devices resides in. -weight float The relative weight of the device in comparison to other - devices. This usually corresponds directly to the amount of - disk space the device has compared to other devices. For - instance a device with 1 terabyte of space might have a weight - of 100.0 and another device with 2 terabytes of space might - have a weight of 200.0. This weight can also be used to bring - back into balance a device that has ended up with more or less - data than desired over time. A good average weight of 100.0 - allows flexibility in lowering the weight later if necessary. -ip string The IP address of the server containing the device. -port int The TCP port the listening server process uses that serves - requests for the device. -device string The on disk name of the device on the server. - For example: sdb1 -meta string A general-use field for storing additional information for the - device. This information isn't used directly by the server - processes, but can be useful in debugging. For example, the - date and time of installation and hardware manufacturer could - be stored here. -====== ======= ============================================================== - -Note: The list of devices may contain holes, or indexes set to None, for -devices that have been removed from the cluster. Generally, device ids are not -reused. Also, some devices may be temporarily disabled by setting their weight -to 0.0. To obtain a list of active devices (for uptime polling, for example) -the Python code would look like: ``devices = [device for device in self.devs if -device and device['weight']]`` +The list of devices is known internally to the Ring class as ``devs``. Each +item in the list of devices is a dictionary with the following keys: + +.. table:: + :widths: 10 10 80 + + ====== ======= ============================================================== + id integer The index into the list of devices. + zone integer The zone in which the device resides. + region integer The region in which the zone resides. + weight float The relative weight of the device in comparison to other + devices. This usually corresponds directly to the amount of + disk space the device has compared to other devices. For + instance a device with 1 terabyte of space might have a weight + of 100.0 and another device with 2 terabytes of space might + have a weight of 200.0. This weight can also be used to bring + back into balance a device that has ended up with more or less + data than desired over time. A good average weight of 100.0 + allows flexibility in lowering the weight later if necessary. + ip string The IP address or hostname of the server containing the device. + port int The TCP port on which the server process listens to serve + requests for the device. + device string The on-disk name of the device on the server. + For example: ``sdb1`` + meta string A general-use field for storing additional information for the + device. This information isn't used directly by the server + processes, but can be useful in debugging. For example, the + date and time of installation and hardware manufacturer could + be stored here. 
+ ====== ======= ============================================================== + +.. note:: + The list of devices may contain holes, or indexes set to ``None``, for + devices that have been removed from the cluster. However, device ids are + reused. Device ids are reused to avoid potentially running out of device id + slots when there are available slots (from prior removal of devices). A + consequence of this device id reuse is that the device id (integer value) + does not necessarily correspond with the chronology of when the device was + added to the ring. Also, some devices may be temporarily disabled by + setting their weight to ``0.0``. To obtain a list of active devices (for + uptime polling, for example) the Python code would look like:: + + devices = list(self._iter_devs()) ************************* Partition Assignment List ************************* -This is a list of array('I') of devices ids. The outermost list contains an -array('I') for each replica. Each array('I') has a length equal to the -partition count for the ring. Each integer in the array('I') is an index into -the above list of devices. The partition list is known internally to the Ring -class as _replica2part2dev_id. +The partition assignment list is known internally to the Ring class as +``_replica2part2dev_id``. This is a list of ``array('H')``\s, one for each +replica. Each ``array('H')`` has a length equal to the partition count for the +ring. Each integer in the ``array('H')`` is an index into the above list of +devices. So, to create a list of device dictionaries assigned to a partition, the Python -code would look like: ``devices = [self.devs[part2dev_id[partition]] for -part2dev_id in self._replica2part2dev_id]`` +code would look like:: -array('I') is used for memory conservation as there may be millions of + devices = [self.devs[part2dev_id[partition]] + for part2dev_id in self._replica2part2dev_id] + +``array('H')`` is used for memory conservation as there may be millions of partitions. ********************* Partition Shift Value ********************* -The partition shift value is known internally to the Ring class as _part_shift. -This value used to shift an MD5 hash to calculate the partition on which the -data for that hash should reside. Only the top four bytes of the hash is used -in this process. For example, to compute the partition for the path -/account/container/object the Python code might look like: ``partition = -unpack_from('>I', md5('/account/container/object').digest())[0] >> -self._part_shift`` +The partition shift value is known internally to the Ring class as +``_part_shift``. This value is used to shift an MD5 hash of an item's path to +calculate the partition on which the data for that item should reside. Only the +top four bytes of the hash are used in this process. For example, to compute +the partition for the path ``/account/container/object``, the Python code might +look like:: + + objhash = md5('/account/container/object').digest() + partition = struct.unpack_from('>I', objhash)[0] >> self._part_shift + +For a ring generated with partition power ``P``, the partition shift value is +``32 - P``. + +******************* +Fractional Replicas +******************* + +A ring is not restricted to having an integer number of replicas. In order to +support the gradual changing of replica counts, the ring is able to have a real +number of replicas. 
+ +When the number of replicas is not an integer, the last element of +``_replica2part2dev_id`` will have a length that is less than the partition +count for the ring. This means that some partitions will have more replicas +than others. For example, if a ring has ``3.25`` replicas, then 25% of its +partitions will have four replicas, while the remaining 75% will have just +three. + +.. _ring_dispersion: + +********** +Dispersion +********** + +With each rebalance, the ring builder calculates a dispersion metric. This is +the percentage of partitions in the ring that have too many replicas within a +particular failure domain. + +For example, if you have three servers in a cluster but two replicas for a +partition get placed onto the same server, that partition will count towards +the dispersion metric. + +A lower dispersion value is better, and the value can be used to find the +proper value for "overload". + +.. _ring_overload: + +******** +Overload +******** + +The ring builder tries to keep replicas as far apart as possible while +still respecting device weights. When it can't do both, the overload +factor determines what happens. Each device may take some extra +fraction of its desired partitions to allow for replica dispersion; +once that extra fraction is exhausted, replicas will be placed closer +together than is optimal for durability. + +Essentially, the overload factor lets the operator trade off replica +dispersion (durability) against device balance (uniform disk usage). + +The default overload factor is ``0``, so device weights will be strictly +followed. + +With an overload factor of ``0.1``, each device will accept 10% more +partitions than it otherwise would, but only if needed to maintain +dispersion. + +Example: Consider a 3-node cluster of machines with equal-size disks; +let node A have 12 disks, node B have 12 disks, and node C have only +11 disks. Let the ring have an overload factor of ``0.1`` (10%). + +Without the overload, some partitions would end up with replicas only +on nodes A and B. However, with the overload, every device is willing +to accept up to 10% more partitions for the sake of dispersion. The +missing disk in C means there is one disk's worth of partitions that +would like to spread across the remaining 11 disks, which gives each +disk in C an extra 9.09% load. Since this is less than the 10% +overload, there is one replica of each partition on each node. + +However, this does mean that the disks in node C will have more data +on them than the disks in nodes A and B. If 80% full is the warning +threshold for the cluster, node C's disks will reach 80% full while A +and B's disks are only 72.7% full. + +------------------------------- +Partition & Replica Terminology +------------------------------- + +All descriptions of consistent hashing describe the process of breaking the +keyspace up into multiple ranges (vnodes, buckets, etc.) - many more than the +number of "nodes" to which keys in the keyspace must be assigned. Swift calls +these ranges `partitions` - they are partitions of the total keyspace. + +Each partition will have multiple replicas. Every replica of each partition +must be assigned to a device in the ring. When describing a specific replica +of a partition (like when it's assigned a device) it is described as a +`part-replica` in that it is a specific `replica` of the specific `partition`. 
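To make the term concrete, here is a minimal sketch (purely illustrative; the part power and replica count are invented values, not taken from any real ring) that enumerates every part-replica in a small ring::

    # Sketch: every replica of every partition is a "part-replica" that
    # must be assigned to some device in the ring.
    part_power = 10
    replica_count = 3
    part_count = 2 ** part_power

    part_replicas = [(part, replica)
                     for replica in range(replica_count)
                     for part in range(part_count)]
    # len(part_replicas) == replica_count * part_count == 3072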
+A single device will likely be assigned different replicas from many +partitions, but it may not be assigned multiple replicas of a single partition. + +The total number of partitions in a ring is calculated as ``2 ** +<part-power>``. The total number of part-replicas in a ring is calculated as +``<replica-count> * 2 ** <part-power>``. + +When considering a device's `weight` it is useful to describe the number of +part-replicas it would like to be assigned. A single device, regardless of +weight, will never hold more than ``2 ** <part-power>`` part-replicas because +it can not have more than one replica of any partition assigned. The number of +part-replicas a device can take by weights is calculated as its `parts-wanted`. +The true number of part-replicas assigned to a device can be compared to its +parts-wanted similarly to a calculation of percentage error - this deviation in +the observed result from the idealized target is called a device's `balance`. + +When considering a device's `failure domain` it is useful to describe the number +of part-replicas it would like to be assigned. The number of part-replicas +wanted in a failure domain of a tier is the sum of the part-replicas wanted in +the failure domains of its sub-tier. However, collectively when the total +number of part-replicas in a failure domain exceeds or is equal to ``2 ** +<part-power>`` it is most obvious that it's no longer sufficient to consider +only the number of total part-replicas, but rather the fraction of each +replica's partitions. Consider for example a ring with 3 replicas and 3 +servers: while dispersion requires that each server hold only ⅓ of the total +part-replicas, placement is additionally constrained to require ``1.0`` replica +of *each* partition per server. It would not be sufficient to satisfy +dispersion if two devices on one of the servers each held a replica of a single +partition, while another server held none. By considering a decimal fraction +of one replica's worth of partitions in a failure domain we can derive the +total part-replicas wanted in a failure domain (``1.0 * 2 ** <part-power>``). +Additionally we infer more about `which` part-replicas must go in the failure +domain. Consider a ring with three replicas and two zones, each with two +servers (four servers total). The three replicas worth of partitions will be +assigned into two failure domains at the zone tier. Each zone must hold more +than one replica of some partitions. We represent this improper fraction of a +replica's worth of partitions in decimal form as ``1.5`` (``3.0 / 2``). This +tells us not only the *number* of total partitions (``1.5 * 2 ** +<part-power>``) but also that *each* partition must have `at least` one replica +in this failure domain (in fact ``0.5`` of the partitions will have 2 +replicas). Within each zone the two servers will hold ``0.75`` of a replica's +worth of partitions - this is equal both to "the fraction of a replica's worth +of partitions assigned to each zone (``1.5``) divided evenly among the number +of failure domains in its sub-tier (2 servers in each zone, i.e. ``1.5 / 2``)" +but *also* "the total number of replicas (``3.0``) divided evenly among the +total number of failure domains in the server tier (2 servers × 2 zones = 4, +i.e. ``3.0 / 4``)". It is useful to consider that each server in this ring +will hold only ``0.75`` of a replica's worth of partitions which tells us that any +server should have `at most` one replica of a given partition assigned.
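The arithmetic in the example above can be sketched directly (illustrative only, assuming equal device weights; the real builder derives these values from the weights and topology recorded in the ring)::

    # Sketch: spread 3 replicas across 2 zones, each with 2 servers.
    def replicanths_per_tier(replica_count, zone_count, servers_per_zone):
        per_zone = replica_count / zone_count      # 3.0 / 2 = 1.5
        per_server = per_zone / servers_per_zone   # 1.5 / 2 = 0.75
        return per_zone, per_server

    per_zone, per_server = replicanths_per_tier(3.0, 2, 2)
    # per_zone == 1.5    -> each partition needs at least one replica per zone
    # per_server == 0.75 -> no server should hold two replicas of one partition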
In the +interests of brevity, some variable names will often refer to the concept +representing the fraction of a replica's worth of partitions in decimal form as +*replicanths* - this is meant to invoke connotations similar to ordinal numbers +as applied to fractions, but generalized to a replica instead of a four\*th* or +a fif\*th*. The "n" was probably thrown in because of Blade Runner. ----------------- Building the Ring ----------------- -The initial building of the ring first calculates the number of partitions that -should ideally be assigned to each device based the device's weight. For -example, if the partition power of 20 the ring will have 1,048,576 partitions. -If there are 1,000 devices of equal weight they will each desire 1,048.576 -partitions. The devices are then sorted by the number of partitions they desire -and kept in order throughout the initialization process. - -Then, the ring builder assigns each replica of each partition to the device -that desires the most partitions at that point while keeping it as far away as -possible from other replicas. The ring builder prefers to assign a replica to a -device in a zone that has no replicas already; should there be no such zone -available, the ring builder will try to find a device on a different server; -failing that, it will just look for a device that has no replicas; finally, if -all other options are exhausted, the ring builder will assign the replica to -the device that has the fewest replicas already assigned. - -When building a new ring based on an old ring, the desired number of partitions -each device wants is recalculated. Next the partitions to be reassigned are -gathered up. Any removed devices have all their assigned partitions unassigned -and added to the gathered list. Any partition replicas that (due to the -addition of new devices) can be spread out for better durability are unassigned -and added to the gathered list. Any devices that have more partitions than they -now desire have random partitions unassigned from them and added to the -gathered list. Lastly, the gathered partitions are then reassigned to devices -using a similar method as in the initial assignment described above. +First the ring builder calculates the replicanths wanted at each tier in the +ring's topology based on weight. + +Then the ring builder calculates the replicanths wanted at each tier in the +ring's topology based on dispersion. + +Then the ring builder calculates the maximum deviation on a single device +between its weighted replicanths and wanted replicanths. + +Next we interpolate between the two replicanth values (weighted & wanted) at +each tier using the specified overload (up to the maximum required overload). +It's a linear interpolation, similar to solving for a point on a line between +two points - we calculate the slope across the max required overload and then +calculate the intersection of the line with the desired overload. This +becomes the target. + +From the target we calculate the minimum and maximum number of replicas any +partition may have in a tier. This becomes the `replica-plan`. + +Finally, we calculate the number of partitions that should ideally be assigned +to each device based on the replica-plan.
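The interpolation step above can be sketched as follows (a simplified illustration, not the actual RingBuilder code; the per-tier bookkeeping is omitted and the numbers are invented)::

    # Sketch: move from the weighted replicanths toward the dispersion-wanted
    # replicanths in proportion to overload / max_required_overload.
    def target_replicanths(weighted, wanted, overload, max_required_overload):
        if max_required_overload <= 0:
            # No overload is required: weighted placement already disperses.
            return wanted
        overload = min(overload, max_required_overload)
        return weighted + (wanted - weighted) * (overload / max_required_overload)

    # A tier weighted for 0.9 replicanths that wants 1.0 for dispersion,
    # with overload 0.05 against a maximum required overload of 0.1:
    print(target_replicanths(0.9, 1.0, 0.05, 0.1))  # 0.95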
+ +On initial balance (i.e., the first time partitions are placed to generate a +ring) we must assign each replica of each partition to the device that desires +the most partitions excluding any devices that already have their maximum +number of replicas of that partition assigned to some parent tier of that +device's failure domain. + +When building a new ring based on an old ring, the desired number of +partitions each device wants is recalculated from the current replica-plan. +Next the partitions to be reassigned are gathered up. Any removed devices have +all their assigned partitions unassigned and added to the gathered list. Any +partition replicas that (due to the addition of new devices) can be spread out +for better durability are unassigned and added to the gathered list. Any +devices that have more partitions than they now desire have random partitions +unassigned from them and added to the gathered list. Lastly, the gathered +partitions are then reassigned to devices using a similar method as in the +initial assignment described above. Whenever a partition has a replica reassigned, the time of the reassignment is recorded. This is taken into account when gathering partitions to reassign so that no partition is moved twice in a configurable amount of time. This configurable amount of time is known internally to the RingBuilder class as -min_part_hours. This restriction is ignored for replicas of partitions on -devices that have been removed, as removing a device only happens on device +``min_part_hours``. This restriction is ignored for replicas of partitions on +devices that have been removed, as device removal should only happen on device failure and there's no choice but to make a reassignment. The above processes don't always perfectly rebalance a ring due to the random nature of gathering partitions for reassignment. To help reach a more balanced -ring, the rebalance process is repeated until near perfect (less 1% off) or -when the balance doesn't improve by at least 1% (indicating we probably can't -get perfect balance due to wildly imbalanced zones or too many partitions -recently moved). +ring, the rebalance process is repeated a fixed number of times until the +replica-plan is fulfilled or unable to be fulfilled (indicating we probably +can't get perfect balance due to too many partitions recently moved). + + +.. _composite_rings: --------------- Composite Rings --------------- See :ref:`composite_builder`. ********************************** swift-ring-composer (Experimental) ********************************** .. automodule:: swift.cli.ringcomposer --------------------- Ring Builder Analyzer --------------------- .. automodule:: swift.cli.ring_builder_analyzer ------- History ------- The ring code went through many iterations before arriving at what it is now -and while it has been stable for a while now, the algorithm may be tweaked or -perhaps even fundamentally changed if new ideas emerge. This section will try +and while it has largely been stable, the algorithm has seen a few tweaks or +perhaps even fundamental changes as new ideas emerge. This section will try to describe the previous ideas attempted and attempt to explain why they were discarded. A "live ring" option was considered where each server could maintain its own copy of the ring and the servers would use a gossip protocol to communicate the changes they made. This was discarded as too complex and error prone to code -correctly in the project time span available.
One bug could easily gossip bad +correctly in the project timespan available. One bug could easily gossip bad data out to the entire cluster and be difficult to recover from. Having an externally managed ring simplifies the process, allows full validation of data before it's shipped out to the servers, and guarantees each server is using a @@ -195,18 +402,18 @@ like the current process but where servers could submit change requests to the ring server to have a new ring built and shipped back out to the servers. This was discarded due to project time constraints and because ring changes are currently infrequent enough that manual control was sufficient. However, lack -of quick automatic ring changes did mean that other parts of the system had to -be coded to handle devices being unavailable for a period of hours until +of quick automatic ring changes did mean that other components of the system +had to be coded to handle devices being unavailable for a period of hours until someone could manually update the ring. The current ring process has each replica of a partition independently assigned to a device. A version of the ring that used a third of the memory was tried, where the first replica of a partition was directly assigned and the other two were determined by "walking" the ring until finding additional devices in other -zones. This was discarded as control was lost as to how many replicas for a -given partition moved at once. Keeping each replica independent allows for +zones. This was discarded due to the loss of control over how many replicas for +a given partition moved at once. Keeping each replica independent allows for moving only one partition replica within a given time window (except due to -device failures). Using the additional memory was deemed a good tradeoff for +device failures). Using the additional memory was deemed a good trade-off for moving data around the cluster much less often. Another ring design was tried where the partition to device assignments weren't @@ -219,16 +426,16 @@ add up. In the end, the memory savings wasn't that great and more processing power was used, so the idea was discarded. A completely non-partitioned ring was also tried but discarded as the -partitioning helps many other parts of the system, especially replication. +partitioning helps many other components of the system, especially replication. Replication can be attempted and retried in a partition batch with the other replicas rather than each data item independently attempted and retried. Hashes of directory structures can be calculated and compared with other replicas to reduce directory walking and network traffic. Partitioning and independently assigning partition replicas also allowed for -the best balanced cluster. The best of the other strategies tended to give -+-10% variance on device balance with devices of equal weight and +-15% with -devices of varying weights. The current strategy allows us to get +-3% and +-8% +the best-balanced cluster. The best of the other strategies tended to give +±10% variance on device balance with devices of equal weight and ±15% with +devices of varying weights. The current strategy allows us to get ±3% and ±8% respectively. Various hashing algorithms were tried. SHA offers better security, but the ring @@ -237,3 +444,19 @@ faster, but MD5 was built-in and hash computation is a small percentage of the overall request handling time. 
In all, once it was decided the servers wouldn't be maintaining the rings themselves anyway and only doing hash lookups, MD5 was chosen for its general availability, good distribution, and adequate speed. + +The placement algorithm has seen a number of behavioral changes for +unbalanceable rings. The ring builder wants to keep replicas as far apart as +possible while still respecting device weights. In most cases, the ring +builder can achieve both, but sometimes they conflict. At first, the behavior +was to keep the replicas far apart and ignore device weight, but that made it +impossible to gradually go from one region to two, or from two to three. Then +it was changed to favor device weight over dispersion, but that wasn't so good +for rings that were close to balanceable, like 3 machines with 60TB, 60TB, and +57TB of disk space; operators were expecting one replica per machine, but +didn't always get it. After that, overload was added to the ring builder so +that operators could choose a balance between dispersion and device weights. +In time the overload concept was improved and made more accurate. + +For more background on consistent hashing rings, please see +:doc:`ring_background`. diff --git a/doc/source/overview_ring_format.rst b/doc/source/overview_ring_format.rst new file mode 100644 index 0000000000..7f108c3d8c --- /dev/null +++ b/doc/source/overview_ring_format.rst @@ -0,0 +1,253 @@ +================= +Ring File Formats +================= + +The ring is the most important data structure in Swift. How this data structure +has been serialized to disk has changed over the years. + +Initially, ring files contained three key pieces of information: + +* the part_power value (often stored as ``part_shift := 32 - part_power``) + + * which determines how many partitions are in the ring, + +* the device list + + * which includes all the disks participating in the ring, and + +* the replica-to-part-to-device table + + * which has all ``replica_count * (2 ** part_power)`` partition assignments. + +But the desire to add more data structures +to the serialized ring has meant that a new ring v2 format has been created. + +Ring files have always been gzipped when serialized, though the inner, +raw format has evolved over the years. + +Ring v0 +------- + +Initially, rings were simply pickle dumps of the RingData object. `With +Swift 1.3.0 `__, this +changed to pickling a pure-stdlib data structure, but the core concept +was the same. + +.. note:: + + Swift 2.36.0 dropped support for v0 rings. + +Ring v1 +------- + +Pickle presented some problems, however. While `there are security +concerns `__ around unpickling +untrusted data, security boundaries are generally drawn such that rings are +assumed to be trusted. Ultimately, what pushed us to a new format were +`performance considerations `__. + +Starting in `Swift 1.7.0 `__, +Swift began using a new format (while still being willing to read the old one). +The new format starts with some magic so we may identify it as such:: + + +---------------+-------+ + |'R' '1' 'N' 'G'| | + +---------------+-------+ + +where ``<version>`` is a network-order two-byte version number (which is always 1). +After that, a JSON object is serialized as:: + + +---------------+-------...---+ + | | | + +---------------+-------...---+ + +where ``<json_len>`` is the network-order four-byte length (in bytes) of +``<json>``, which is the ASCII-encoded JSON-serialized object.
This object +has at minimum three keys: + +* ``devs`` for the device list +* ``part_shift`` (i.e., ``32 - part_power``) +* ``replica_count`` for the integer number of part-to-device rows to read + +The replica-to-part-to-device table then follows:: + + +-------+-------+...+-------+-------+ + | | |...| | | + +-------+-------+...+-------+-------+ + | | |...| | | + +-------+-------+...+-------+-------+ + | ... | + +-------+-------+...+-------+-------+ + | | |...| + +-------+-------+...+ + +Each ``<dev_id>`` is a host-order two-byte index into the ``devs`` list. Every row +except the last has exactly ``2 ** part_power`` entries; the last row may +have the same or fewer. + +The metadata object has proven quite versatile: new keys have been added +to provide additional information while remaining backwards-compatible. +In order, the following new fields have been added: + +* ``byteorder`` specifies whether the host-order for the + replica-to-part-to-device table is "big" or "little" endian. Added in + `Swift 2.12.0 `__, + this allows rings written on big-endian machines to be read on + little-endian machines and vice-versa. +* ``next_part_power`` indicates whether a partition-power increase is in + progress. Added in `Swift 2.15.0 `__, + this will have one of two values, if present: the ring's current + ``part_power``, indicating that there may be hardlinks to clean up, + or ``part_power + 1`` indicating that hardlinks may need to be created. + See :ref:`the documentation` + for more information. +* ``version`` specifies the version number of the ring-builder that was used + to write this ring. Added in `Swift 2.24.0 `__, + this allows comparing rings from different machines to determine + which is newer. + +Ring v2 +------- + +The way that v1 rings dealt with fractional replicas made it impossible +to reliably serialize additional large data structures after the +replica-to-part-to-device table. The v2 format has been designed to be +extensible. + +The new format starts with magic similar to v1:: + + +---------------+-------+ + |'R' '1' 'N' 'G'| | + +---------------+-------+ + +where ``<version>`` is again a network-order two-byte version number (which is now 2). +By bumping the version number, we ensure that old versions of Swift refuse to +read the ring, rather than misinterpret the content. + +After that, a series of BLOBs are serialized, each as:: + + +-------------------------------+-------...---+ + | | | + +-------------------------------+-------...---+ + +where ``<blob_len>`` is the network-order eight-byte length (in bytes) of +``<blob>``. Each BLOB is preceded by a ``Z_FULL_FLUSH`` to allow it to be +decompressed without reading the whole file. + +The order of the BLOBs isn't important, although they do tend to be written +in the order Swift will read them while loading. This reduces the disk seeks +necessary to load the ring. + +The final BLOB is an index: a JSON object mapping named sections to an array +of offsets within the file, like + +.. code:: + + { + section: [ + compressed start, + uncompressed start, + compressed end, + uncompressed end, + checksum method, + checksum value + ], + ... + } + +Section names may be arbitrary strings, but the "swift/" prefix is reserved +for upstream use. The start/end values mark the beginning and ending of the +section's BLOB. Note that some end values may be ``null`` if they were not +known when the index was written -- in particular, this *will* be true for +the index itself.
The checksum method should be one of ``"md5"``, ``"sha1"``, +``"sha256"``, or ``"sha512"``; other values will be ignored in anticipation +of a need to support further algorithms. The checksum value will be the +hex-encoded digest of the uncompressed section's bytes. Like end values, +checksum data may be ``null`` if not known when the index is written. + +Finally, a "tail" is written: + +* the gzip stream is flushed with another ``Z_FULL_FLUSH``, +* the stream is switched to uncompressed, +* the eight-byte offset of the uncompressed start of the index is written, +* the gzip stream is flushed with another ``Z_FULL_FLUSH``, +* the eight-byte offset of the compressed start of the index is written, +* the gzip stream is flushed with another ``Z_FULL_FLUSH``, and +* the gzip stream is closed; this involves: + + * flushing the underlying deflate stream with ``Z_FINISH`` + * writing ``CRC32`` (of the full uncompressed data) + * writing ``ISIZE`` (the length of the full uncompressed data ``mod 2 ** 32``) + +By switching to uncompressed, we can know exactly how many bytes will be +written in the tail, so that when reading we can quickly seek to and read the +index offset, seek to the index start, and read the index. From there we +can do similar things for any other section. + +In full, to locate and read the index, a reader can: + +* Seek to the end of the file +* Go back 31 bytes in the underlying file; this should leave us at the start of + the deflate block containing the offset for the compressed start +* Decompress 8 bytes from the deflate stream to get the location of the + compressed start of the index BLOB +* Seek to that location +* Read/decompress the size of the index BLOB +* Read/decompress the json serialized index. + +.. note:: This 31 bytes is the deflate block containing the 8 byte location, + a ``Z_FULL_FLUSH`` block, the ``Z_FINISH`` block, and the ``CRC32`` and + ``ISIZE``. For more information, see `RFC 1951`_ (for the deflate stream) + and `RFC 1952`_ (for the gzip format). + +The currently defined sections and section names upstream are as follows: + +* ``swift/index`` - The swift index +* ``swift/ring/metadata`` - Ring metadata serialized as JSON +* ``swift/ring/devices`` - The JSON-serialized device list. + + * This has been separated from the ring metadata structure in v1 as it + gets large + +* ``swift/ring/assignments`` - The ring replica2part2dev_id data structure + +.. note:: + Third parties may find it useful to add their own sections; however, + the ``swift/`` prefix is reserved for future upstream enhancements. + +swift/ring/metadata +~~~~~~~~~~~~~~~~~~~ +This BLOB is an ASCII-encoded JSON object full of metadata, similar +to v1 rings. It has the following required keys: + +* ``part_shift`` +* ``dev_id_bytes`` specifies the number of bytes used for each ``<dev_id>`` in the + replica-to-part-to-device table; will be one of 2, 4, or 8 + +Additionally, there are several optional keys which may be present: + +* ``next_part_power`` +* ``version`` + +Notice that two keys are no longer present: ``replica_count`` is no longer +needed as the size of the replica-to-part-to-device table is explicit, and +``byteorder`` is not needed as all data in v2 rings should be written using +network-order. + +swift/ring/devices +~~~~~~~~~~~~~~~~~~ +This BLOB contains a list of Swift device dictionaries. It was separated out +from the metadata BLOB as it can become a large structure in its own right. + +swift/ring/assignments +~~~~~~~~~~~~~~~~~~~~~~ +This BLOB is the replica-to-part-to-device table.
Its length will be +``replicas * (2 ** part_power) * dev_id_bytes``, where ``replicas`` is the exact +(potentially fractional) replica count for the ring. Unlike in v1, each +``<dev_id>`` is written using network-order. + +Note that this is why we increased the size of ``<dev_id>`` as compared to +the v1 format -- otherwise, we may not be able to represent rings with both +high ``replica_count`` and high ``part_power``. + +.. _RFC 1952: https://rfc-editor.org/rfc/rfc1952 +.. _RFC 1951: https://rfc-editor.org/rfc/rfc1951 diff --git a/doc/source/overview_wsgi_management.rst b/doc/source/overview_wsgi_management.rst new file mode 100644 index 0000000000..ab1098afe5 --- /dev/null +++ b/doc/source/overview_wsgi_management.rst @@ -0,0 +1,87 @@ +WSGI Server Process Management +============================== + +Graceful Shutdowns with ``SIGHUP`` +---------------------------------- + +Swift has always supported graceful WSGI server shutdown via ``SIGHUP``. +This causes the manager process to fall out of its +ensure-all-workers-are-running loop, close all workers' listen sockets, +and exit. Closing the listen sockets causes all new ``accept`` calls to +fail, but does not impact any established connections. + +The workers are re-parented, likely to PID 1, and are discoverable with +``swift-orphans``. When the ``accept`` call fails, the worker waits for the +connection-handling ``GreenPool`` to complete, then exits. Each worker +continues processing the current request, then closes the connection. +Note that clients will get connection errors if they try to re-use a +connection for further requests. + +Prior to the introduction of seamless reloads (see below), a common +reload strategy was to perform a graceful shutdown followed by a fresh +service start. + +Seamless Reloads with ``SIGUSR1`` +--------------------------------- + +Beginning with Swift 2.24.0, WSGI servers support seamless reloads via +``SIGUSR1``. This allows servers to restart to pick up configuration or +code changes while being minimally disruptive to clients. The process +is as follows: + +.. image:: images/reload_process_tree_1.svg + +1. Manager process receives ``USR1`` signal. This causes the process to fall + out of its loop ensuring that all workers are running and instead begin + reloading. The workers continue servicing client requests as long as + their listen sockets remain open. + +.. image:: images/reload_process_tree_2.svg + +2. Manager process forks. The new child knows about all the existing + workers and their listen sockets; it will be responsible for closing + the old worker listen sockets so they stop accepting new connections. + +.. image:: images/reload_process_tree_3.svg + +3. Manager process re-exec's itself. It picks up new configuration and + code while maintaining the same PID as the old manager process. At + this point only the socket-closer is tracking the old workers, but + everything (including old workers) remains a child of the new manager + process. As a result, old workers are *not* discoverable with + ``swift-orphans``; ``swift-oldies`` may be useful, but will also find + the manager process. + +.. image:: images/reload_process_tree_4.svg + +4. New manager process forks off new workers, each with its own listen + socket. Once all workers have started and can accept new connections, + the manager notifies the socket-closer via a pipe. The socket-closer + closes the old worker listen sockets so they stop accepting new + connections, passes the list of old workers to the new manager, + then exits. + +.. 
image:: images/reload_process_tree_5.svg + +5. Old workers continue servicing any in-progress connections, while new + connections are picked up by new workers. Once an old worker completes + all of its outstanding requests, it exits. Beginning with Swift 2.35.0, + if any workers persist beyond ``stale_worker_timeout``, the new manager + will clean them up with ``KILL`` signals. + +.. image:: images/reload_process_tree_6.svg + +6. All old workers have now exited. Only new code and configs are in use. + +``swift-reload`` +---------------- + +Beginning with Swift 2.33.0, a new ``swift-reload`` helper is included +to help validate the reload process. Given a PID, it will + +1. Validate that the PID seems to belong to a Swift WSGI server manager + process, +2. Check that the config file used by that PID is currently valid, +3. Send the ``USR1`` signal to initiate a reload, and +4. Wait for the new workers to come up (indicating the reload is complete) + before exiting. diff --git a/doc/source/policies_saio.rst b/doc/source/policies_saio.rst new file mode 100644 index 0000000000..9a8f6ce2e8 --- /dev/null +++ b/doc/source/policies_saio.rst @@ -0,0 +1,177 @@ +=========================================== +Adding Storage Policies to an Existing SAIO +=========================================== + +Depending on when you downloaded your SAIO environment, it may already +be prepared with two storage policies that enable some basic functional +tests. In the event that you are adding a storage policy to an existing +installation, however, the following section will walk you through the +steps for setting up Storage Policies. Note that configuring more than +one storage policy on your development environment is recommended but +optional. Enabling multiple Storage Policies is very easy regardless of +whether you are working with an existing installation or starting a +brand new one. + +Now we will create two policies - the first one will be a standard triple +replication policy that we will also explicitly set as the default and +the second will be set up for reduced replication using a factor of 2x. +We will call the first one 'gold' and the second one 'silver'. In this +example both policies map to the same devices because it's important +for this sample implementation to be simple and easy +to understand; adding a bunch of new devices isn't really required +to implement a usable set of policies. + +1. To define your policies, add the following to your ``/etc/swift/swift.conf`` + file: + + .. code:: ini + + [storage-policy:0] + name = gold + aliases = yellow, orange + default = yes + + [storage-policy:1] + name = silver + + See :doc:`overview_policies` for detailed information on ``swift.conf`` policy + options. + +2. To create the object ring for the silver policy (index 1), add the following + to your ``bin/remakerings`` script and re-run it (your script may already have + these changes): + + .. code:: shell + + swift-ring-builder object-1.builder create 10 2 1 + swift-ring-builder object-1.builder add r1z1-127.0.0.1:6210/sdb1 1 + swift-ring-builder object-1.builder add r1z2-127.0.0.1:6220/sdb2 1 + swift-ring-builder object-1.builder add r1z3-127.0.0.1:6230/sdb3 1 + swift-ring-builder object-1.builder add r1z4-127.0.0.1:6240/sdb4 1 + swift-ring-builder object-1.builder rebalance + + Note that the reduced replication of the silver policy is only a function + of the replication parameter in the ``swift-ring-builder create`` command + and is not specified in ``/etc/swift/swift.conf``. + +3. 
Copy ``etc/container-reconciler.conf-sample`` to + ``/etc/swift/container-reconciler.conf`` and fix the user option: + + .. code:: shell + + cp etc/container-reconciler.conf-sample /etc/swift/container-reconciler.conf + sed -i "s/# user.*/user = $USER/g" /etc/swift/container-reconciler.conf + +------------------ +Using Policies +------------------ + +Setting up Storage Policies was very simple, and using them is even +simpler. In this section, we will run some commands to create a few +containers with different policies and store objects in them and see how +Storage Policies affect placement of data in Swift. + +1. We will be using the list_endpoints middleware to confirm object locations, + so enable that now in your ``proxy-server.conf`` file by adding it to the pipeline + and including the filter section as shown below (be sure to restart your proxy + after making these changes): + + .. code:: ini + + pipeline = catch_errors gatekeeper healthcheck proxy-logging cache bulk \ + slo dlo ratelimit crossdomain list-endpoints tempurl tempauth staticweb \ + container-quotas account-quotas proxy-logging proxy-server + + [filter:list-endpoints] + use = egg:swift#list_endpoints + +2. Check to see that your policies are reported via /info: + + .. code:: shell + + swift -A http://127.0.0.1:8080/auth/v1.0 -U test:tester -K testing info + + You should see this: (only showing the policy output here): + + .. code:: none + + policies: [{'aliases': 'gold, yellow, orange', 'default': True, + 'name': 'gold'}, {'aliases': 'silver', 'name': 'silver'}] + +3. Now create a container without specifying a policy; it will use the + default, 'gold'. Then put a test object in it (create the file ``file0.txt`` + with your favorite editor and add some content): + + .. code:: shell + + curl -v -X PUT -H 'X-Auth-Token: <token>' \ + http://127.0.0.1:8080/v1/AUTH_test/myCont0 + curl -X PUT -v -T file0.txt -H 'X-Auth-Token: <token>' \ + http://127.0.0.1:8080/v1/AUTH_test/myCont0/file0.txt + +4. Now confirm placement of the object with the :ref:`list_endpoints` middleware: + + .. code:: shell + + curl -X GET -v http://127.0.0.1:8080/endpoints/AUTH_test/myCont0/file0.txt + + You should see this: (note placement on expected devices): + + .. code:: json + + ["http://127.0.0.1:6230/sdb3/761/AUTH_test/myCont0/file0.txt", + "http://127.0.0.1:6210/sdb1/761/AUTH_test/myCont0/file0.txt", + "http://127.0.0.1:6220/sdb2/761/AUTH_test/myCont0/file0.txt"] + +5. Create a container using policy 'silver' and put a different file in it: + + .. code:: shell + + curl -v -X PUT -H 'X-Auth-Token: <token>' -H \ + "X-Storage-Policy: silver" \ + http://127.0.0.1:8080/v1/AUTH_test/myCont1 + curl -X PUT -v -T file1.txt -H 'X-Auth-Token: <token>' \ + http://127.0.0.1:8080/v1/AUTH_test/myCont1/ + +6. Confirm placement of the object for policy 'silver': + + .. code:: shell + + curl -X GET -v http://127.0.0.1:8080/endpoints/AUTH_test/myCont1/file1.txt + + You should see this: (note placement on expected devices): + + .. code:: json + + ["http://127.0.0.1:6210/sdb1/32/AUTH_test/myCont1/file1.txt", + "http://127.0.0.1:6240/sdb4/32/AUTH_test/myCont1/file1.txt"] + +7. Confirm account information with HEAD; make sure that your container-updater + service is running and has executed once since you performed the PUTs or the + account database won't be updated yet: + + .. code:: shell + + curl -i -X HEAD -H 'X-Auth-Token: <token>' \ + http://127.0.0.1:8080/v1/AUTH_test + + You should see something like this (note that total and per policy stats + object sizes will vary): + + .. 
code:: none + + HTTP/1.1 204 No Content + Content-Length: 0 + X-Account-Object-Count: 2 + X-Account-Bytes-Used: 174 + X-Account-Container-Count: 2 + X-Account-Storage-Policy-Gold-Object-Count: 1 + X-Account-Storage-Policy-Gold-Bytes-Used: 84 + X-Account-Storage-Policy-Silver-Object-Count: 1 + X-Account-Storage-Policy-Silver-Bytes-Used: 90 + X-Timestamp: 1397230339.71525 + Content-Type: text/plain; charset=utf-8 + Accept-Ranges: bytes + X-Trans-Id: tx96e7496b19bb44abb55a3-0053482c75 + X-Openstack-Request-Id: tx96e7496b19bb44abb55a3-0053482c75 + Date: Fri, 11 Apr 2014 17:55:01 GMT diff --git a/doc/source/proxy.rst b/doc/source/proxy.rst index 210480d7eb..405d06280d 100644 --- a/doc/source/proxy.rst +++ b/doc/source/proxy.rst @@ -4,6 +4,43 @@ Proxy ***** +.. _proxy-controllers: + +Proxy Controllers +================= + +Base +~~~~ + +.. automodule:: swift.proxy.controllers.base + :members: + :undoc-members: + :show-inheritance: + +Account +~~~~~~~ + +.. automodule:: swift.proxy.controllers.account + :members: + :undoc-members: + :show-inheritance: + +Container +~~~~~~~~~ + +.. automodule:: swift.proxy.controllers.container + :members: + :undoc-members: + :show-inheritance: + +Object +~~~~~~ + +.. automodule:: swift.proxy.controllers.obj + :members: + :undoc-members: + :show-inheritance: + .. _proxy-server: Proxy Server diff --git a/doc/source/ratelimit.rst b/doc/source/ratelimit.rst index 3b5f95bd03..81832f2bf2 100644 --- a/doc/source/ratelimit.rst +++ b/doc/source/ratelimit.rst @@ -1,8 +1,10 @@ +.. _ratelimit: + ============= Rate Limiting ============= -Rate limiting in swift is implemented as a pluggable middleware. Rate +Rate limiting in Swift is implemented as a pluggable middleware. Rate limiting is performed on requests that result in database writes to the account and container sqlite dbs. It uses memcached and is dependent on the proxy servers having highly synchronized time. The rate limits are @@ -15,38 +17,44 @@ Configuration All configuration is optional. If no account or container limits are provided there will be no rate limiting. Configuration available: -======================== ========= =========================================== -Option Default Description ------------------------- --------- ------------------------------------------- -clock_accuracy 1000 Represents how accurate the proxy servers' - system clocks are with each other. 1000 - means that all the proxies' clock are - accurate to each other within 1 - millisecond. No ratelimit should be - higher than the clock accuracy. -max_sleep_time_seconds 60 App will immediately return a 498 response - if the necessary sleep time ever exceeds - the given max_sleep_time_seconds. -log_sleep_time_seconds 0 To allow visibility into rate limiting set - this value > 0 and all sleeps greater than - the number will be logged. -rate_buffer_seconds 5 Number of seconds the rate counter can - drop and be allowed to catch up (at a - faster than listed rate). A larger number - will result in larger spikes in rate but - better average accuracy. -account_ratelimit 0 If set, will limit PUT and DELETE requests - to /account_name/container_name. - Number is in requests per second. -account_whitelist '' Comma separated lists of account names that - will not be rate limited. -account_blacklist '' Comma separated lists of account names that - will not be allowed. Returns a 497 response. -container_ratelimit_size '' When set with container_limit_x = r: - for containers of size x, limit requests - per second to r. 
Will limit PUT, DELETE, - and POST requests to /a/c/o. -======================== ========= =========================================== +================================ ======= ====================================== +Option Default Description +-------------------------------- ------- -------------------------------------- +clock_accuracy 1000 Represents how accurate the proxy + servers' system clocks are with each + other. 1000 means that all the + proxies' clock are accurate to each + other within 1 millisecond. No + ratelimit should be higher than the + clock accuracy. +max_sleep_time_seconds 60 App will immediately return a 498 + response if the necessary sleep time + ever exceeds the given + max_sleep_time_seconds. +log_sleep_time_seconds 0 To allow visibility into rate limiting + set this value > 0 and all sleeps + greater than the number will be + logged. +rate_buffer_seconds 5 Number of seconds the rate counter can + drop and be allowed to catch up (at a + faster than listed rate). A larger + number will result in larger spikes in + rate but better average accuracy. +account_ratelimit 0 If set, will limit PUT and DELETE + requests to + /account_name/container_name. Number + is in requests per second. +container_ratelimit_size '' When set with container_ratelimit_x = + r: for containers of size x, limit + requests per second to r. Will limit + PUT, DELETE, and POST requests to + /a/c/o. +container_listing_ratelimit_size '' When set with + container_listing_ratelimit_x = r: for + containers of size x, limit listing + requests per second to r. Will limit + GET requests to /a/c. +================================ ======= ====================================== The container rate limits are linearly interpolated from the values given. A sample container rate limiting could be: @@ -70,3 +78,35 @@ Container Size Rate Limit ================ ============ +----------------------------- +Account Specific Ratelimiting +----------------------------- + + +The above ratelimiting is to prevent the "many writes to a single container" +bottleneck from causing a problem. There could also be a problem where a single +account is just using too much of the cluster's resources. In this case, the +container ratelimits may not help because the customer could be doing thousands +of reqs/sec to distributed containers each getting a small fraction of the +total so those limits would never trigger. If a system administrator notices +this, he/she can set the X-Account-Sysmeta-Global-Write-Ratelimit on an account +and that will limit the total number of write requests (PUT, POST, DELETE, +COPY) that account can do for the whole account. This limit will be in addition +to the applicable account/container limits from above. This header will be +hidden from the user, because of the gatekeeper middleware, and can only be set +using a direct client to the account nodes. It accepts a float value and will +only limit requests if the value is > 0. + +------------------- +Black/White-listing +------------------- + +To blacklist or whitelist an account set: + +X-Account-Sysmeta-Global-Write-Ratelimit: BLACKLIST + +or + +X-Account-Sysmeta-Global-Write-Ratelimit: WHITELIST + +in the account headers. diff --git a/doc/source/replication_network.rst b/doc/source/replication_network.rst new file mode 100644 index 0000000000..6740ec8250 --- /dev/null +++ b/doc/source/replication_network.rst @@ -0,0 +1,527 @@ +.. 
_Dedicated-replication-network: + +============================= +Dedicated replication network +============================= + +------- +Summary +------- + +Swift's replication process is essential for consistency and availability of +data. By default, replication activity will use the same network interface as +other cluster operations. However, if a replication interface is set in the +ring for a node, that node will send replication traffic on its designated +separate replication network interface. Replication traffic includes REPLICATE +requests and rsync traffic. + +To separate the cluster-internal replication traffic from client traffic, +separate replication servers can be used. These replication servers are based +on the standard storage servers, but they listen on the replication IP and +only respond to REPLICATE requests. Storage servers can serve REPLICATE +requests, so an operator can transition to using a separate replication +network with no cluster downtime. + +Replication IP and port information is stored in the ring on a per-node basis. +These parameters will be used if they are present, but they are not required. +If this information does not exist or is empty for a particular node, the +node's standard IP and port will be used for replication. + +-------------------- +For SAIO replication +-------------------- + +#. Create new script in ``~/bin/`` (for example: ``remakerings_new``):: + + #!/bin/bash + set -e + cd /etc/swift + rm -f *.builder *.ring.gz backups/*.builder backups/*.ring.gz + swift-ring-builder object.builder create 10 3 1 + swift-ring-builder object.builder add z1-127.0.0.1:6210R127.0.0.1:6250/sdb1 1 + swift-ring-builder object.builder add z2-127.0.0.1:6220R127.0.0.1:6260/sdb2 1 + swift-ring-builder object.builder add z3-127.0.0.1:6230R127.0.0.1:6270/sdb3 1 + swift-ring-builder object.builder add z4-127.0.0.1:6240R127.0.0.1:6280/sdb4 1 + swift-ring-builder object.builder rebalance + swift-ring-builder object-1.builder create 10 2 1 + swift-ring-builder object-1.builder add z1-127.0.0.1:6210R127.0.0.1:6250/sdb1 1 + swift-ring-builder object-1.builder add z2-127.0.0.1:6220R127.0.0.1:6260/sdb2 1 + swift-ring-builder object-1.builder add z3-127.0.0.1:6230R127.0.0.1:6270/sdb3 1 + swift-ring-builder object-1.builder add z4-127.0.0.1:6240R127.0.0.1:6280/sdb4 1 + swift-ring-builder object-1.builder rebalance + swift-ring-builder object-2.builder create 10 6 1 + swift-ring-builder object-2.builder add z1-127.0.0.1:6210R127.0.0.1:6250/sdb1 1 + swift-ring-builder object-2.builder add z1-127.0.0.1:6210R127.0.0.1:6250/sdb5 1 + swift-ring-builder object-2.builder add z2-127.0.0.1:6220R127.0.0.1:6260/sdb2 1 + swift-ring-builder object-2.builder add z2-127.0.0.1:6220R127.0.0.1:6260/sdb6 1 + swift-ring-builder object-2.builder add z3-127.0.0.1:6230R127.0.0.1:6270/sdb3 1 + swift-ring-builder object-2.builder add z3-127.0.0.1:6230R127.0.0.1:6270/sdb7 1 + swift-ring-builder object-2.builder add z4-127.0.0.1:6240R127.0.0.1:6280/sdb4 1 + swift-ring-builder object-2.builder add z4-127.0.0.1:6240R127.0.0.1:6280/sdb8 1 + swift-ring-builder object-2.builder rebalance + swift-ring-builder container.builder create 10 3 1 + swift-ring-builder container.builder add z1-127.0.0.1:6211R127.0.0.1:6251/sdb1 1 + swift-ring-builder container.builder add z2-127.0.0.1:6221R127.0.0.1:6261/sdb2 1 + swift-ring-builder container.builder add z3-127.0.0.1:6231R127.0.0.1:6271/sdb3 1 + swift-ring-builder container.builder add z4-127.0.0.1:6241R127.0.0.1:6281/sdb4 1 + swift-ring-builder 
container.builder rebalance + swift-ring-builder account.builder create 10 3 1 + swift-ring-builder account.builder add z1-127.0.0.1:6212R127.0.0.1:6252/sdb1 1 + swift-ring-builder account.builder add z2-127.0.0.1:6222R127.0.0.1:6262/sdb2 1 + swift-ring-builder account.builder add z3-127.0.0.1:6232R127.0.0.1:6272/sdb3 1 + swift-ring-builder account.builder add z4-127.0.0.1:6242R127.0.0.1:6282/sdb4 1 + swift-ring-builder account.builder rebalance + + .. note:: + Syntax of adding device has been changed: ``R:`` + was added between ``z-:`` and ``/_ ``. + Added devices will use and for replication activities. + +#. Add next rows in ``/etc/rsyncd.conf``:: + + [account6252] + max connections = 25 + path = /srv/1/node/ + read only = false + lock file = /var/lock/account6252.lock + + [account6262] + max connections = 25 + path = /srv/2/node/ + read only = false + lock file = /var/lock/account6262.lock + + [account6272] + max connections = 25 + path = /srv/3/node/ + read only = false + lock file = /var/lock/account6272.lock + + [account6282] + max connections = 25 + path = /srv/4/node/ + read only = false + lock file = /var/lock/account6282.lock + + + [container6251] + max connections = 25 + path = /srv/1/node/ + read only = false + lock file = /var/lock/container6251.lock + + [container6261] + max connections = 25 + path = /srv/2/node/ + read only = false + lock file = /var/lock/container6261.lock + + [container6271] + max connections = 25 + path = /srv/3/node/ + read only = false + lock file = /var/lock/container6271.lock + + [container6281] + max connections = 25 + path = /srv/4/node/ + read only = false + lock file = /var/lock/container6281.lock + + + [object6250] + max connections = 25 + path = /srv/1/node/ + read only = false + lock file = /var/lock/object6250.lock + + [object6260] + max connections = 25 + path = /srv/2/node/ + read only = false + lock file = /var/lock/object6260.lock + + [object6270] + max connections = 25 + path = /srv/3/node/ + read only = false + lock file = /var/lock/object6270.lock + + [object6280] + max connections = 25 + path = /srv/4/node/ + read only = false + lock file = /var/lock/object6280.lock + +#. Restart rsync daemon:: + + service rsync restart + +#. Update configuration files in directories: + + * /etc/swift/object-server(files: 1.conf, 2.conf, 3.conf, 4.conf) + * /etc/swift/container-server(files: 1.conf, 2.conf, 3.conf, 4.conf) + * /etc/swift/account-server(files: 1.conf, 2.conf, 3.conf, 4.conf) + + delete all configuration options in section ``[<*>-replicator]`` + +#. 
Add configuration files for object-server, in ``/etc/swift/object-server/`` + + * 5.conf:: + + [DEFAULT] + devices = /srv/1/node + mount_check = false + disable_fallocate = true + bind_port = 6250 + user = swift + log_facility = LOG_LOCAL2 + recon_cache_path = /var/cache/swift + + [pipeline:main] + pipeline = recon object-server + + [app:object-server] + use = egg:swift#object + replication_server = True + + [filter:recon] + use = egg:swift#recon + + [object-replicator] + rsync_module = {replication_ip}::object{replication_port} + + * 6.conf:: + + [DEFAULT] + devices = /srv/2/node + mount_check = false + disable_fallocate = true + bind_port = 6260 + user = swift + log_facility = LOG_LOCAL3 + recon_cache_path = /var/cache/swift2 + + [pipeline:main] + pipeline = recon object-server + + [app:object-server] + use = egg:swift#object + replication_server = True + + [filter:recon] + use = egg:swift#recon + + [object-replicator] + rsync_module = {replication_ip}::object{replication_port} + + * 7.conf:: + + [DEFAULT] + devices = /srv/3/node + mount_check = false + disable_fallocate = true + bind_port = 6270 + user = swift + log_facility = LOG_LOCAL4 + recon_cache_path = /var/cache/swift3 + + [pipeline:main] + pipeline = recon object-server + + [app:object-server] + use = egg:swift#object + replication_server = True + + [filter:recon] + use = egg:swift#recon + + [object-replicator] + rsync_module = {replication_ip}::object{replication_port} + + * 8.conf:: + + [DEFAULT] + devices = /srv/4/node + mount_check = false + disable_fallocate = true + bind_port = 6280 + user = swift + log_facility = LOG_LOCAL5 + recon_cache_path = /var/cache/swift4 + + [pipeline:main] + pipeline = recon object-server + + [app:object-server] + use = egg:swift#object + replication_server = True + + [filter:recon] + use = egg:swift#recon + + [object-replicator] + rsync_module = {replication_ip}::object{replication_port} + +#. 
Add configuration files for container-server, in ``/etc/swift/container-server/`` + + * 5.conf:: + + [DEFAULT] + devices = /srv/1/node + mount_check = false + disable_fallocate = true + bind_port = 6251 + user = swift + log_facility = LOG_LOCAL2 + recon_cache_path = /var/cache/swift + + [pipeline:main] + pipeline = recon container-server + + [app:container-server] + use = egg:swift#container + replication_server = True + + [filter:recon] + use = egg:swift#recon + + [container-replicator] + rsync_module = {replication_ip}::container{replication_port} + + * 6.conf:: + + [DEFAULT] + devices = /srv/2/node + mount_check = false + disable_fallocate = true + bind_port = 6261 + user = swift + log_facility = LOG_LOCAL3 + recon_cache_path = /var/cache/swift2 + + [pipeline:main] + pipeline = recon container-server + + [app:container-server] + use = egg:swift#container + replication_server = True + + [filter:recon] + use = egg:swift#recon + + [container-replicator] + rsync_module = {replication_ip}::container{replication_port} + + * 7.conf:: + + [DEFAULT] + devices = /srv/3/node + mount_check = false + disable_fallocate = true + bind_port = 6271 + user = swift + log_facility = LOG_LOCAL4 + recon_cache_path = /var/cache/swift3 + + [pipeline:main] + pipeline = recon container-server + + [app:container-server] + use = egg:swift#container + replication_server = True + + [filter:recon] + use = egg:swift#recon + + [container-replicator] + rsync_module = {replication_ip}::container{replication_port} + + * 8.conf:: + + [DEFAULT] + devices = /srv/4/node + mount_check = false + disable_fallocate = true + bind_port = 6281 + user = swift + log_facility = LOG_LOCAL5 + recon_cache_path = /var/cache/swift4 + + [pipeline:main] + pipeline = recon container-server + + [app:container-server] + use = egg:swift#container + replication_server = True + + [filter:recon] + use = egg:swift#recon + + [container-replicator] + rsync_module = {replication_ip}::container{replication_port} + +#. 
Add configuration files for account-server, in ``/etc/swift/account-server/`` + + * 5.conf:: + + [DEFAULT] + devices = /srv/1/node + mount_check = false + disable_fallocate = true + bind_port = 6252 + user = swift + log_facility = LOG_LOCAL2 + recon_cache_path = /var/cache/swift + + [pipeline:main] + pipeline = recon account-server + + [app:account-server] + use = egg:swift#account + replication_server = True + + [filter:recon] + use = egg:swift#recon + + [account-replicator] + rsync_module = {replication_ip}::account{replication_port} + + * 6.conf:: + + [DEFAULT] + devices = /srv/2/node + mount_check = false + disable_fallocate = true + bind_port = 6262 + user = swift + log_facility = LOG_LOCAL3 + recon_cache_path = /var/cache/swift2 + + [pipeline:main] + pipeline = recon account-server + + [app:account-server] + use = egg:swift#account + replication_server = True + + [filter:recon] + use = egg:swift#recon + + [account-replicator] + rsync_module = {replication_ip}::account{replication_port} + + * 7.conf:: + + [DEFAULT] + devices = /srv/3/node + mount_check = false + disable_fallocate = true + bind_port = 6272 + user = swift + log_facility = LOG_LOCAL4 + recon_cache_path = /var/cache/swift3 + + [pipeline:main] + pipeline = recon account-server + + [app:account-server] + use = egg:swift#account + replication_server = True + + [filter:recon] + use = egg:swift#recon + + [account-replicator] + rsync_module = {replication_ip}::account{replication_port} + + * 8.conf:: + + [DEFAULT] + devices = /srv/4/node + mount_check = false + disable_fallocate = true + bind_port = 6282 + user = swift + log_facility = LOG_LOCAL5 + recon_cache_path = /var/cache/swift4 + + [pipeline:main] + pipeline = recon account-server + + [app:account-server] + use = egg:swift#account + replication_server = True + + [filter:recon] + use = egg:swift#recon + + [account-replicator] + rsync_module = {replication_ip}::account{replication_port} + + +--------------------------------- +For a Multiple Server replication +--------------------------------- + +#. Move configuration file. + + * Configuration file for object-server from /etc/swift/object-server.conf to /etc/swift/object-server/1.conf + + * Configuration file for container-server from /etc/swift/container-server.conf to /etc/swift/container-server/1.conf + + * Configuration file for account-server from /etc/swift/account-server.conf to /etc/swift/account-server/1.conf + +#. Add changes in configuration files in directories: + + * /etc/swift/object-server(files: 1.conf) + * /etc/swift/container-server(files: 1.conf) + * /etc/swift/account-server(files: 1.conf) + + delete all configuration options in section [<*>-replicator] + +#. Add configuration files for object-server, in /etc/swift/object-server/2.conf:: + + [DEFAULT] + bind_ip = $STORAGE_LOCAL_NET_IP + workers = 2 + + [pipeline:main] + pipeline = object-server + + [app:object-server] + use = egg:swift#object + replication_server = True + + [object-replicator] + +#. Add configuration files for container-server, in /etc/swift/container-server/2.conf:: + + [DEFAULT] + bind_ip = $STORAGE_LOCAL_NET_IP + workers = 2 + + [pipeline:main] + pipeline = container-server + + [app:container-server] + use = egg:swift#container + replication_server = True + + [container-replicator] + +#. 
Add configuration files for account-server, in /etc/swift/account-server/2.conf:: + + [DEFAULT] + bind_ip = $STORAGE_LOCAL_NET_IP + workers = 2 + + [pipeline:main] + pipeline = account-server + + [app:account-server] + use = egg:swift#account + replication_server = True + + [account-replicator] + diff --git a/doc/source/ring.rst b/doc/source/ring.rst index d8f5a611f4..196a0b88a3 100644 --- a/doc/source/ring.rst +++ b/doc/source/ring.rst @@ -4,6 +4,16 @@ Partitioned Consistent Hash Ring ******************************** +.. _ring-io: + +Ring IO +======= + +.. automodule:: swift.common.ring.io + :members: + :undoc-members: + :show-inheritance: + .. _ring: Ring @@ -23,3 +33,13 @@ Ring Builder :members: :undoc-members: :show-inheritance: + +.. _composite_builder: + +Composite Ring Builder +====================== + +.. automodule:: swift.common.ring.composite_builder + :members: + :undoc-members: + :show-inheritance: diff --git a/doc/source/ring_background.rst b/doc/source/ring_background.rst new file mode 100644 index 0000000000..cc6ade8b85 --- /dev/null +++ b/doc/source/ring_background.rst @@ -0,0 +1,966 @@ +================================== +Building a Consistent Hashing Ring +================================== + +------------------------------------ +Authored by Greg Holt, February 2011 +------------------------------------ + +This is a compilation of five posts I made earlier discussing how to build +a consistent hashing ring. The posts seemed to be accessed quite frequently, +so I've gathered them all here on one page for easier reading. + +.. note:: + This is an historical document; as such, all code examples are Python 2. + If this makes you squirm, think of it as pseudo-code. Regardless of + implementation language, the state of the art in consistent-hashing and + distributed systems more generally has advanced. We hope that this + introduction from first principles will still prove informative, + particularly with regard to how data is distributed within a Swift + cluster. + +Part 1 +====== +"Consistent Hashing" is a term used to describe a process where data is +distributed using a hashing algorithm to determine its location. Using +only the hash of the id of the data you can determine exactly where that +data should be. This mapping of hashes to locations is usually termed a +"ring". + +Probably the simplest hash is just a modulus of the id. For instance, if +all ids are numbers and you have two machines you wish to distribute data +to, you could just put all odd numbered ids on one machine and even numbered +ids on the other. Assuming you have a balanced number of odd and even +numbered ids, and a balanced data size per id, your data would be balanced +between the two machines. + +Since data ids are often textual names and not numbers, like paths for +files or URLs, it makes sense to use a "real" hashing algorithm to convert +the names to numbers first. Using MD5 for instance, the hash of the name +'mom.png' is '4559a12e3e8da7c2186250c2f292e3af' and the hash of 'dad.png' +is '096edcc4107e9e18d6a03a43b3853bea'. Now, using the modulus, we can +place 'mom.jpg' on the odd machine and 'dad.png' on the even one. Another +benefit of using a hashing algorithm like MD5 is that the resulting hashes +have a known even distribution, meaning your ids will be evenly distributed +without worrying about keeping the id values themselves evenly distributed. + +Here is a simple example of this in action: + +.. 
code-block:: python + + from hashlib import md5 + from struct import unpack_from + + NODE_COUNT = 100 + DATA_ID_COUNT = 10000000 + + node_counts = [0] * NODE_COUNT + for data_id in range(DATA_ID_COUNT): + data_id = str(data_id) + # This just pulls part of the hash out as an integer + hsh = unpack_from('>I', md5(data_id).digest())[0] + node_id = hsh % NODE_COUNT + node_counts[node_id] += 1 + desired_count = DATA_ID_COUNT / NODE_COUNT + print '%d: Desired data ids per node' % desired_count + max_count = max(node_counts) + over = 100.0 * (max_count - desired_count) / desired_count + print '%d: Most data ids on one node, %.02f%% over' % \ + (max_count, over) + min_count = min(node_counts) + under = 100.0 * (desired_count - min_count) / desired_count + print '%d: Least data ids on one node, %.02f%% under' % \ + (min_count, under) + +:: + + 100000: Desired data ids per node + 100695: Most data ids on one node, 0.69% over + 99073: Least data ids on one node, 0.93% under + +So that's not bad at all; less than a percent over/under for distribution +per node. In the next part of this series we'll examine where modulus +distribution causes problems and how to improve our ring to overcome them. + +Part 2 +====== +In Part 1 of this series, we did a simple test of using the modulus of a +hash to locate data. We saw very good distribution, but that's only part +of the story. Distributed systems not only need to distribute load, but +they often also need to grow as more and more data is placed in it. + +So let's imagine we have a 100 node system up and running using our +previous algorithm, but it's starting to get full so we want to add +another node. When we add that 101st node to our algorithm we notice +that many ids now map to different nodes than they previously did. +We're going to have to shuffle a ton of data around our system to get +it all into place again. + +Let's examine what's happened on a much smaller scale: just 2 nodes +again, node 0 gets even ids and node 1 gets odd ids. So data id 100 +would map to node 0, data id 101 to node 1, data id 102 to node 0, etc. +This is simply node = id % 2. Now we add a third node (node 2) for more +space, so we want node = id % 3. So now data id 100 maps to node id 1, +data id 101 to node 2, and data id 102 to node 0. So we have to move +data for 2 of our 3 ids so they can be found again. + +Let's examine this at a larger scale: + +.. code-block:: python + + from hashlib import md5 + from struct import unpack_from + + NODE_COUNT = 100 + NEW_NODE_COUNT = 101 + DATA_ID_COUNT = 10000000 + + moved_ids = 0 + for data_id in range(DATA_ID_COUNT): + data_id = str(data_id) + hsh = unpack_from('>I', md5(str(data_id)).digest())[0] + node_id = hsh % NODE_COUNT + new_node_id = hsh % NEW_NODE_COUNT + if node_id != new_node_id: + moved_ids += 1 + percent_moved = 100.0 * moved_ids / DATA_ID_COUNT + print '%d ids moved, %.02f%%' % (moved_ids, percent_moved) + +:: + + 9900989 ids moved, 99.01% + +Wow, that's severe. We'd have to shuffle around 99% of our data just +to increase our capacity 1%! We need a new algorithm that combats this +behavior. + +This is where the "ring" really comes in. We can assign ranges of hashes +directly to nodes and then use an algorithm that minimizes the changes +to those ranges. Back to our small scale, let's say our ids range from 0 +to 999. We have two nodes and we'll assign data ids 0–499 to node 0 and +500–999 to node 1. 
Later, when we add node 2, we can take half the data +ids from node 0 and half from node 1, minimizing the amount of data that +needs to move. + +Let's examine this at a larger scale: + +.. code-block:: python + + from bisect import bisect_left + from hashlib import md5 + from struct import unpack_from + + NODE_COUNT = 100 + NEW_NODE_COUNT = 101 + DATA_ID_COUNT = 10000000 + + node_range_starts = [] + for node_id in range(NODE_COUNT): + node_range_starts.append(DATA_ID_COUNT / + NODE_COUNT * node_id) + new_node_range_starts = [] + for new_node_id in range(NEW_NODE_COUNT): + new_node_range_starts.append(DATA_ID_COUNT / + NEW_NODE_COUNT * new_node_id) + moved_ids = 0 + for data_id in range(DATA_ID_COUNT): + data_id = str(data_id) + hsh = unpack_from('>I', md5(str(data_id)).digest())[0] + node_id = bisect_left(node_range_starts, + hsh % DATA_ID_COUNT) % NODE_COUNT + new_node_id = bisect_left(new_node_range_starts, + hsh % DATA_ID_COUNT) % NEW_NODE_COUNT + if node_id != new_node_id: + moved_ids += 1 + percent_moved = 100.0 * moved_ids / DATA_ID_COUNT + print '%d ids moved, %.02f%%' % (moved_ids, percent_moved) + +:: + + 4901707 ids moved, 49.02% + +Okay, that is better. But still, moving 50% of our data to add 1% capacity +is not very good. If we examine what happened more closely we'll see what +is an "accordion effect". We shrunk node 0's range a bit to give to the +new node, but that shifted all the other node's ranges by the same amount. + +We can minimize the change to a node's assigned range by assigning several +smaller ranges instead of the single broad range we were before. This can +be done by creating "virtual nodes" for each node. So 100 nodes might have +1000 virtual nodes. Let's examine how that might work. + +.. code-block:: python + + from bisect import bisect_left + from hashlib import md5 + from struct import unpack_from + + NODE_COUNT = 100 + DATA_ID_COUNT = 10000000 + VNODE_COUNT = 1000 + + vnode_range_starts = [] + vnode2node = [] + for vnode_id in range(VNODE_COUNT): + vnode_range_starts.append(DATA_ID_COUNT / + VNODE_COUNT * vnode_id) + vnode2node.append(vnode_id % NODE_COUNT) + new_vnode2node = list(vnode2node) + new_node_id = NODE_COUNT + NEW_NODE_COUNT = NODE_COUNT + 1 + vnodes_to_reassign = VNODE_COUNT / NEW_NODE_COUNT + while vnodes_to_reassign > 0: + for node_to_take_from in range(NODE_COUNT): + for vnode_id, node_id in enumerate(new_vnode2node): + if node_id == node_to_take_from: + new_vnode2node[vnode_id] = new_node_id + vnodes_to_reassign -= 1 + break + if vnodes_to_reassign <= 0: + break + moved_ids = 0 + for data_id in range(DATA_ID_COUNT): + data_id = str(data_id) + hsh = unpack_from('>I', md5(str(data_id)).digest())[0] + vnode_id = bisect_left(vnode_range_starts, + hsh % DATA_ID_COUNT) % VNODE_COUNT + node_id = vnode2node[vnode_id] + new_node_id = new_vnode2node[vnode_id] + if node_id != new_node_id: + moved_ids += 1 + percent_moved = 100.0 * moved_ids / DATA_ID_COUNT + print '%d ids moved, %.02f%%' % (moved_ids, percent_moved) + +:: + + 90423 ids moved, 0.90% + +There we go, we added 1% capacity and only moved 0.9% of existing data. +The vnode_range_starts list seems a bit out of place though. Its values +are calculated and never change for the lifetime of the cluster, so let's +optimize that out. + +.. 
code-block:: python + + from bisect import bisect_left + from hashlib import md5 + from struct import unpack_from + + NODE_COUNT = 100 + DATA_ID_COUNT = 10000000 + VNODE_COUNT = 1000 + + vnode2node = [] + for vnode_id in range(VNODE_COUNT): + vnode2node.append(vnode_id % NODE_COUNT) + new_vnode2node = list(vnode2node) + new_node_id = NODE_COUNT + vnodes_to_reassign = VNODE_COUNT / (NODE_COUNT + 1) + while vnodes_to_reassign > 0: + for node_to_take_from in range(NODE_COUNT): + for vnode_id, node_id in enumerate(vnode2node): + if node_id == node_to_take_from: + vnode2node[vnode_id] = new_node_id + vnodes_to_reassign -= 1 + break + if vnodes_to_reassign <= 0: + break + moved_ids = 0 + for data_id in range(DATA_ID_COUNT): + data_id = str(data_id) + hsh = unpack_from('>I', md5(str(data_id)).digest())[0] + vnode_id = hsh % VNODE_COUNT + node_id = vnode2node[vnode_id] + new_node_id = new_vnode2node[vnode_id] + if node_id != new_node_id: + moved_ids += 1 + percent_moved = 100.0 * moved_ids / DATA_ID_COUNT + print '%d ids moved, %.02f%%' % (moved_ids, percent_moved) + +:: + + 89841 ids moved, 0.90% + +There we go. In the next part of this series, will further examine the +algorithm's limitations and how to improve on it. + +Part 3 +====== +In Part 2 of this series, we reached an algorithm that performed well +even when adding new nodes to the cluster. We used 1000 virtual nodes +that could be independently assigned to nodes, allowing us to minimize +the amount of data moved when a node was added. + +The number of virtual nodes puts a cap on how many real nodes you can +have. For example, if you have 1000 virtual nodes and you try to add a +1001st real node, you can't assign a virtual node to it without leaving +another real node with no assignment, leaving you with just 1000 active +real nodes still. + +Unfortunately, the number of virtual nodes created at the beginning can +never change for the life of the cluster without a lot of careful work. +For example, you could double the virtual node count by splitting each +existing virtual node in half and assigning both halves to the same real +node. However, if the real node uses the virtual node's id to optimally +store the data (for example, all data might be stored in /[virtual node +id]/[data id]) it would have to move data around locally to reflect the +change. And it would have to resolve data using both the new and old +locations while the moves were taking place, making atomic operations +difficult or impossible. + +Let's continue with this assumption that changing the virtual node +count is more work than it's worth, but keep in mind that some applications +might be fine with this. + +The easiest way to deal with this limitation is to make the limit high +enough that it won't matter. For instance, if we decide our cluster will +never exceed 60,000 real nodes, we can just make 60,000 virtual nodes. + +Also, we should include in our calculations the relative size of our +nodes. For instance, a year from now we might have real nodes that can +handle twice the capacity of our current nodes. So we'd want to assign +twice the virtual nodes to those future nodes, so maybe we should raise +our virtual node estimate to 120,000. + +A good rule to follow might be to calculate 100 virtual nodes to each +real node at maximum capacity. This would allow you to alter the load +on any given node by 1%, even at max capacity, which is pretty fine +tuning. So now we're at 6,000,000 virtual nodes for a max capacity cluster +of 60,000 real nodes. 
+ +6 million virtual nodes seems like a lot, and it might seem like we'd +use up way too much memory. But the only structure this affects is the +virtual node to real node mapping. The base amount of memory required +would be 6 million times 2 bytes (to store a real node id from 0 to +65,535). 12 megabytes of memory just isn't that much to use these days. + +Even with all the overhead of flexible data types, things aren't that +bad. I changed the code from the previous part in this series to have +60,000 real and 6,000,000 virtual nodes, changed the list to an array('H'), +and python topped out at 27m of resident memory – and that includes two +rings. + +To change terminology a bit, we're going to start calling these virtual +nodes "partitions". This will make it a bit easier to discern between the +two types of nodes we've been talking about so far. Also, it makes sense +to talk about partitions as they are really just unchanging sections +of the hash space. + +We're also going to always keep the partition count a power of two. This +makes it easy to just use bit manipulation on the hash to determine the +partition rather than modulus. It isn't much faster, but it is a little. +So, here's our updated ring code, using 8,388,608 (2 ** 23) partitions +and 65,536 nodes. We've upped the sample data id set and checked the +distribution to make sure we haven't broken anything. + +.. code-block:: python + + from array import array + from hashlib import md5 + from struct import unpack_from + + PARTITION_POWER = 23 + PARTITION_SHIFT = 32 - PARTITION_POWER + NODE_COUNT = 65536 + DATA_ID_COUNT = 100000000 + + part2node = array('H') + for part in range(2 ** PARTITION_POWER): + part2node.append(part % NODE_COUNT) + node_counts = [0] * NODE_COUNT + for data_id in range(DATA_ID_COUNT): + data_id = str(data_id) + part = unpack_from('>I', + md5(str(data_id)).digest())[0] >> PARTITION_SHIFT + node_id = part2node[part] + node_counts[node_id] += 1 + desired_count = DATA_ID_COUNT / NODE_COUNT + print '%d: Desired data ids per node' % desired_count + max_count = max(node_counts) + over = 100.0 * (max_count - desired_count) / desired_count + print '%d: Most data ids on one node, %.02f%% over' % \ + (max_count, over) + min_count = min(node_counts) + under = 100.0 * (desired_count - min_count) / desired_count + print '%d: Least data ids on one node, %.02f%% under' % \ + (min_count, under) + +:: + + 1525: Desired data ids per node + 1683: Most data ids on one node, 10.36% over + 1360: Least data ids on one node, 10.82% under + +Hmm. +–10% seems a bit high, but I reran with 65,536 partitions and +256 nodes and got +–0.4% so it's just that our sample size (100m) is +too small for our number of partitions (8m). It'll take way too long +to run experiments with an even larger sample size, so let's reduce +back down to these lesser numbers. (To be certain, I reran at the full +version with a 10 billion data id sample set and got +–1%, but it took +6.5 hours to run.) + +In the next part of this series, we'll talk about how to increase the +durability of our data in the cluster. + +Part 4 +====== +In Part 3 of this series, we just further discussed partitions (virtual +nodes) and cleaned up our code a bit based on that. Now, let's talk +about how to increase the durability and availability of our data in the +cluster. + +For many distributed data stores, durability is quite important. Either +RAID arrays or individually distinct copies of data are required. 
While +RAID will increase the durability, it does nothing to increase the +availability – if the RAID machine crashes, the data may be safe but +inaccessible until repairs are done. If we keep distinct copies of the +data on different machines and a machine crashes, the other copies will +still be available while we repair the broken machine. + +An easy way to gain this multiple copy durability/availability is to +just use multiple rings and groups of nodes. For instance, to achieve +the industry standard of three copies, you'd split the nodes into three +groups and each group would have its own ring and each would receive a +copy of each data item. This can work well enough, but has the drawback +that expanding capacity requires adding three nodes at a time and that +losing one node essentially lowers capacity by three times that node's +capacity. + +Instead, let's use a different, but common, approach of meeting our +requirements with a single ring. This can be done by walking the ring +from the starting point and looking for additional distinct nodes. +Here's code that supports a variable number of replicas (set to 3 for +testing): + +.. code-block:: python + + from array import array + from hashlib import md5 + from struct import unpack_from + + REPLICAS = 3 + PARTITION_POWER = 16 + PARTITION_SHIFT = 32 - PARTITION_POWER + PARTITION_MAX = 2 ** PARTITION_POWER - 1 + NODE_COUNT = 256 + DATA_ID_COUNT = 10000000 + + part2node = array('H') + for part in range(2 ** PARTITION_POWER): + part2node.append(part % NODE_COUNT) + node_counts = [0] * NODE_COUNT + for data_id in range(DATA_ID_COUNT): + data_id = str(data_id) + part = unpack_from('>I', + md5(str(data_id)).digest())[0] >> PARTITION_SHIFT + node_ids = [part2node[part]] + node_counts[node_ids[0]] += 1 + for replica in range(1, REPLICAS): + while part2node[part] in node_ids: + part += 1 + if part > PARTITION_MAX: + part = 0 + node_ids.append(part2node[part]) + node_counts[node_ids[-1]] += 1 + desired_count = DATA_ID_COUNT / NODE_COUNT * REPLICAS + print '%d: Desired data ids per node' % desired_count + max_count = max(node_counts) + over = 100.0 * (max_count - desired_count) / desired_count + print '%d: Most data ids on one node, %.02f%% over' % \ + (max_count, over) + min_count = min(node_counts) + under = 100.0 * (desired_count - min_count) / desired_count + print '%d: Least data ids on one node, %.02f%% under' % \ + (min_count, under) + +:: + + 117186: Desired data ids per node + 118133: Most data ids on one node, 0.81% over + 116093: Least data ids on one node, 0.93% under + +That's pretty good; less than 1% over/under. While this works well, +there are a couple of problems. + +First, because of how we've initially assigned the partitions to nodes, +all the partitions for a given node have their extra copies on the same +other two nodes. The problem here is that when a machine fails, the load +on these other nodes will jump by that amount. It'd be better if we +initially shuffled the partition assignment to distribute the failover +load better. + +The other problem is a bit harder to explain, but deals with physical +separation of machines. Imagine you can only put 16 machines in a rack +in your datacenter. The 256 nodes we've been using would fill 16 racks. +With our current code, if a rack goes out (power problem, network issue, +etc.) there is a good chance some data will have all three copies in that +rack, becoming inaccessible. 
We can fix this shortcoming by adding the +concept of zones to our nodes, and then ensuring that replicas are stored +in distinct zones. + +.. code-block:: python + + from array import array + from hashlib import md5 + from random import shuffle + from struct import unpack_from + + REPLICAS = 3 + PARTITION_POWER = 16 + PARTITION_SHIFT = 32 - PARTITION_POWER + PARTITION_MAX = 2 ** PARTITION_POWER - 1 + NODE_COUNT = 256 + ZONE_COUNT = 16 + DATA_ID_COUNT = 10000000 + + node2zone = [] + while len(node2zone) < NODE_COUNT: + zone = 0 + while zone < ZONE_COUNT and len(node2zone) < NODE_COUNT: + node2zone.append(zone) + zone += 1 + part2node = array('H') + for part in range(2 ** PARTITION_POWER): + part2node.append(part % NODE_COUNT) + shuffle(part2node) + node_counts = [0] * NODE_COUNT + zone_counts = [0] * ZONE_COUNT + for data_id in range(DATA_ID_COUNT): + data_id = str(data_id) + part = unpack_from('>I', + md5(str(data_id)).digest())[0] >> PARTITION_SHIFT + node_ids = [part2node[part]] + zones = [node2zone[node_ids[0]]] + node_counts[node_ids[0]] += 1 + zone_counts[zones[0]] += 1 + for replica in range(1, REPLICAS): + while part2node[part] in node_ids and \ + node2zone[part2node[part]] in zones: + part += 1 + if part > PARTITION_MAX: + part = 0 + node_ids.append(part2node[part]) + zones.append(node2zone[node_ids[-1]]) + node_counts[node_ids[-1]] += 1 + zone_counts[zones[-1]] += 1 + desired_count = DATA_ID_COUNT / NODE_COUNT * REPLICAS + print '%d: Desired data ids per node' % desired_count + max_count = max(node_counts) + over = 100.0 * (max_count - desired_count) / desired_count + print '%d: Most data ids on one node, %.02f%% over' % \ + (max_count, over) + min_count = min(node_counts) + under = 100.0 * (desired_count - min_count) / desired_count + print '%d: Least data ids on one node, %.02f%% under' % \ + (min_count, under) + desired_count = DATA_ID_COUNT / ZONE_COUNT * REPLICAS + print '%d: Desired data ids per zone' % desired_count + max_count = max(zone_counts) + over = 100.0 * (max_count - desired_count) / desired_count + print '%d: Most data ids in one zone, %.02f%% over' % \ + (max_count, over) + min_count = min(zone_counts) + under = 100.0 * (desired_count - min_count) / desired_count + print '%d: Least data ids in one zone, %.02f%% under' % \ + (min_count, under) + +:: + + 117186: Desired data ids per node + 118782: Most data ids on one node, 1.36% over + 115632: Least data ids on one node, 1.33% under + 1875000: Desired data ids per zone + 1878533: Most data ids in one zone, 0.19% over + 1869070: Least data ids in one zone, 0.32% under + +So the shuffle and zone distinctions affected our distribution some, +but still definitely good enough. This test took about 64 seconds to +run on my machine. + +There's a completely alternate, and quite common, way of accomplishing +these same requirements. This alternate method doesn't use partitions +at all, but instead just assigns anchors to the nodes within the hash +space. Finding the first node for a given hash just involves walking +this anchor ring for the next node, and finding additional nodes works +similarly as before. To attain the equivalent of our virtual nodes, +each real node is assigned multiple anchors. + +.. 
code-block:: python + + from bisect import bisect_left + from hashlib import md5 + from struct import unpack_from + + REPLICAS = 3 + NODE_COUNT = 256 + ZONE_COUNT = 16 + DATA_ID_COUNT = 10000000 + VNODE_COUNT = 100 + + node2zone = [] + while len(node2zone) < NODE_COUNT: + zone = 0 + while zone < ZONE_COUNT and len(node2zone) < NODE_COUNT: + node2zone.append(zone) + zone += 1 + hash2index = [] + index2node = [] + for node in range(NODE_COUNT): + for vnode in range(VNODE_COUNT): + hsh = unpack_from('>I', md5(str(node)).digest())[0] + index = bisect_left(hash2index, hsh) + if index > len(hash2index): + index = 0 + hash2index.insert(index, hsh) + index2node.insert(index, node) + node_counts = [0] * NODE_COUNT + zone_counts = [0] * ZONE_COUNT + for data_id in range(DATA_ID_COUNT): + data_id = str(data_id) + hsh = unpack_from('>I', md5(str(data_id)).digest())[0] + index = bisect_left(hash2index, hsh) + if index >= len(hash2index): + index = 0 + node_ids = [index2node[index]] + zones = [node2zone[node_ids[0]]] + node_counts[node_ids[0]] += 1 + zone_counts[zones[0]] += 1 + for replica in range(1, REPLICAS): + while index2node[index] in node_ids and \ + node2zone[index2node[index]] in zones: + index += 1 + if index >= len(hash2index): + index = 0 + node_ids.append(index2node[index]) + zones.append(node2zone[node_ids[-1]]) + node_counts[node_ids[-1]] += 1 + zone_counts[zones[-1]] += 1 + desired_count = DATA_ID_COUNT / NODE_COUNT * REPLICAS + print '%d: Desired data ids per node' % desired_count + max_count = max(node_counts) + over = 100.0 * (max_count - desired_count) / desired_count + print '%d: Most data ids on one node, %.02f%% over' % \ + (max_count, over) + min_count = min(node_counts) + under = 100.0 * (desired_count - min_count) / desired_count + print '%d: Least data ids on one node, %.02f%% under' % \ + (min_count, under) + desired_count = DATA_ID_COUNT / ZONE_COUNT * REPLICAS + print '%d: Desired data ids per zone' % desired_count + max_count = max(zone_counts) + over = 100.0 * (max_count - desired_count) / desired_count + print '%d: Most data ids in one zone, %.02f%% over' % \ + (max_count, over) + min_count = min(zone_counts) + under = 100.0 * (desired_count - min_count) / desired_count + print '%d: Least data ids in one zone, %.02f%% under' % \ + (min_count, under) + +:: + + 117186: Desired data ids per node + 351282: Most data ids on one node, 199.76% over + 15965: Least data ids on one node, 86.38% under + 1875000: Desired data ids per zone + 2248496: Most data ids in one zone, 19.92% over + 1378013: Least data ids in one zone, 26.51% under + +This test took over 15 minutes to run! Unfortunately, this method also +gives much less control over the distribution. To get better distribution, +you have to add more virtual nodes, which eats up more memory and takes +even more time to build the ring and perform distinct node lookups. The +most common operation, data id lookup, can be improved (by predetermining +each virtual node's failover nodes, for instance) but it starts off so +far behind our first approach that we'll just stick with that. + +In the next part of this series, we'll start to wrap all this up into +a useful Python module. + +Part 5 +====== +In Part 4 of this series, we ended up with a multiple copy, distinctly +zoned ring. Or at least the start of it. In this final part we'll package +the code up into a useable Python module and then add one last feature. +First, let's separate the ring itself from the building of the data for +the ring and its testing. + +.. 
code-block:: python + + from array import array + from hashlib import md5 + from random import shuffle + from struct import unpack_from + from time import time + + class Ring(object): + + def __init__(self, nodes, part2node, replicas): + self.nodes = nodes + self.part2node = part2node + self.replicas = replicas + partition_power = 1 + while 2 ** partition_power < len(part2node): + partition_power += 1 + if len(part2node) != 2 ** partition_power: + raise Exception("part2node's length is not an " + "exact power of 2") + self.partition_shift = 32 - partition_power + + def get_nodes(self, data_id): + data_id = str(data_id) + part = unpack_from('>I', + md5(data_id).digest())[0] >> self.partition_shift + node_ids = [self.part2node[part]] + zones = [self.nodes[node_ids[0]]] + for replica in range(1, self.replicas): + while self.part2node[part] in node_ids and \ + self.nodes[self.part2node[part]] in zones: + part += 1 + if part >= len(self.part2node): + part = 0 + node_ids.append(self.part2node[part]) + zones.append(self.nodes[node_ids[-1]]) + return [self.nodes[n] for n in node_ids] + + def build_ring(nodes, partition_power, replicas): + begin = time() + part2node = array('H') + for part in range(2 ** partition_power): + part2node.append(part % len(nodes)) + shuffle(part2node) + ring = Ring(nodes, part2node, replicas) + print '%.02fs to build ring' % (time() - begin) + return ring + + def test_ring(ring): + begin = time() + DATA_ID_COUNT = 10000000 + node_counts = {} + zone_counts = {} + for data_id in range(DATA_ID_COUNT): + for node in ring.get_nodes(data_id): + node_counts[node['id']] = \ + node_counts.get(node['id'], 0) + 1 + zone_counts[node['zone']] = \ + zone_counts.get(node['zone'], 0) + 1 + print '%ds to test ring' % (time() - begin) + desired_count = \ + DATA_ID_COUNT / len(ring.nodes) * REPLICAS + print '%d: Desired data ids per node' % desired_count + max_count = max(node_counts.values()) + over = \ + 100.0 * (max_count - desired_count) / desired_count + print '%d: Most data ids on one node, %.02f%% over' % \ + (max_count, over) + min_count = min(node_counts.values()) + under = \ + 100.0 * (desired_count - min_count) / desired_count + print '%d: Least data ids on one node, %.02f%% under' % \ + (min_count, under) + zone_count = \ + len(set(n['zone'] for n in ring.nodes.values())) + desired_count = \ + DATA_ID_COUNT / zone_count * ring.replicas + print '%d: Desired data ids per zone' % desired_count + max_count = max(zone_counts.values()) + over = \ + 100.0 * (max_count - desired_count) / desired_count + print '%d: Most data ids in one zone, %.02f%% over' % \ + (max_count, over) + min_count = min(zone_counts.values()) + under = \ + 100.0 * (desired_count - min_count) / desired_count + print '%d: Least data ids in one zone, %.02f%% under' % \ + (min_count, under) + + if __name__ == '__main__': + PARTITION_POWER = 16 + REPLICAS = 3 + NODE_COUNT = 256 + ZONE_COUNT = 16 + nodes = {} + while len(nodes) < NODE_COUNT: + zone = 0 + while zone < ZONE_COUNT and len(nodes) < NODE_COUNT: + node_id = len(nodes) + nodes[node_id] = {'id': node_id, 'zone': zone} + zone += 1 + ring = build_ring(nodes, PARTITION_POWER, REPLICAS) + test_ring(ring) + +:: + + 0.06s to build ring + 82s to test ring + 117186: Desired data ids per node + 118773: Most data ids on one node, 1.35% over + 115801: Least data ids on one node, 1.18% under + 1875000: Desired data ids per zone + 1878339: Most data ids in one zone, 0.18% over + 1869914: Least data ids in one zone, 0.27% under + +It takes a bit longer to test our ring, 
but that's mostly because of +the switch to dictionaries from arrays for various items. Having node +dictionaries is nice because you can attach any node information you +want directly there (ip addresses, tcp ports, drive paths, etc.). But +we're still on track for further testing; our distribution is still good. + +Now, let's add our one last feature to our ring: the concept of weights. +Weights are useful because the nodes you add later in a ring's life are +likely to have more capacity than those you have at the outset. For this +test, we'll make half our nodes have twice the weight. We'll have to +change build_ring to give more partitions to the nodes with more weight +and we'll change test_ring to take into account these weights. Since +we've changed so much I'll just post the entire module again: + +.. code-block:: python + + from array import array + from hashlib import md5 + from random import shuffle + from struct import unpack_from + from time import time + + class Ring(object): + + def __init__(self, nodes, part2node, replicas): + self.nodes = nodes + self.part2node = part2node + self.replicas = replicas + partition_power = 1 + while 2 ** partition_power < len(part2node): + partition_power += 1 + if len(part2node) != 2 ** partition_power: + raise Exception("part2node's length is not an " + "exact power of 2") + self.partition_shift = 32 - partition_power + + def get_nodes(self, data_id): + data_id = str(data_id) + part = unpack_from('>I', + md5(data_id).digest())[0] >> self.partition_shift + node_ids = [self.part2node[part]] + zones = [self.nodes[node_ids[0]]] + for replica in range(1, self.replicas): + while self.part2node[part] in node_ids and \ + self.nodes[self.part2node[part]] in zones: + part += 1 + if part >= len(self.part2node): + part = 0 + node_ids.append(self.part2node[part]) + zones.append(self.nodes[node_ids[-1]]) + return [self.nodes[n] for n in node_ids] + + def build_ring(nodes, partition_power, replicas): + begin = time() + parts = 2 ** partition_power + total_weight = \ + float(sum(n['weight'] for n in nodes.values())) + for node in nodes.values(): + node['desired_parts'] = \ + parts / total_weight * node['weight'] + part2node = array('H') + for part in range(2 ** partition_power): + for node in nodes.values(): + if node['desired_parts'] >= 1: + node['desired_parts'] -= 1 + part2node.append(node['id']) + break + else: + for node in nodes.values(): + if node['desired_parts'] >= 0: + node['desired_parts'] -= 1 + part2node.append(node['id']) + break + shuffle(part2node) + ring = Ring(nodes, part2node, replicas) + print '%.02fs to build ring' % (time() - begin) + return ring + + def test_ring(ring): + begin = time() + DATA_ID_COUNT = 10000000 + node_counts = {} + zone_counts = {} + for data_id in range(DATA_ID_COUNT): + for node in ring.get_nodes(data_id): + node_counts[node['id']] = \ + node_counts.get(node['id'], 0) + 1 + zone_counts[node['zone']] = \ + zone_counts.get(node['zone'], 0) + 1 + print '%ds to test ring' % (time() - begin) + total_weight = float(sum(n['weight'] for n in + ring.nodes.values())) + max_over = 0 + max_under = 0 + for node in ring.nodes.values(): + desired = DATA_ID_COUNT * REPLICAS * \ + node['weight'] / total_weight + diff = node_counts[node['id']] - desired + if diff > 0: + over = 100.0 * diff / desired + if over > max_over: + max_over = over + else: + under = 100.0 * (-diff) / desired + if under > max_under: + max_under = under + print '%.02f%% max node over' % max_over + print '%.02f%% max node under' % max_under + max_over = 0 + 
max_under = 0 + for zone in set(n['zone'] for n in + ring.nodes.values()): + zone_weight = sum(n['weight'] for n in + ring.nodes.values() if n['zone'] == zone) + desired = DATA_ID_COUNT * REPLICAS * \ + zone_weight / total_weight + diff = zone_counts[zone] - desired + if diff > 0: + over = 100.0 * diff / desired + if over > max_over: + max_over = over + else: + under = 100.0 * (-diff) / desired + if under > max_under: + max_under = under + print '%.02f%% max zone over' % max_over + print '%.02f%% max zone under' % max_under + + if __name__ == '__main__': + PARTITION_POWER = 16 + REPLICAS = 3 + NODE_COUNT = 256 + ZONE_COUNT = 16 + nodes = {} + while len(nodes) < NODE_COUNT: + zone = 0 + while zone < ZONE_COUNT and len(nodes) < NODE_COUNT: + node_id = len(nodes) + nodes[node_id] = {'id': node_id, 'zone': zone, + 'weight': 1.0 + (node_id % 2)} + zone += 1 + ring = build_ring(nodes, PARTITION_POWER, REPLICAS) + test_ring(ring) + +:: + + 0.88s to build ring + 86s to test ring + 1.66% max over + 1.46% max under + 0.28% max zone over + 0.23% max zone under + +So things are still good, even though we have differently weighted nodes. +I ran another test with this code using random weights from 1 to 100 and +got over/under values for nodes of 7.35%/18.12% and zones of 0.24%/0.22%, +still pretty good considering the crazy weight ranges. + +Summary +======= +Hopefully this series has been a good introduction to building a ring. +This code is essentially how the OpenStack Swift ring works, except that +Swift's ring has lots of additional optimizations, such as storing each +replica assignment separately, and lots of extra features for building, +validating, and otherwise working with rings. diff --git a/doc/source/ring_partpower.rst b/doc/source/ring_partpower.rst new file mode 100644 index 0000000000..2e22bec5ed --- /dev/null +++ b/doc/source/ring_partpower.rst @@ -0,0 +1,199 @@ +.. _modify_part_power: + +============================== +Modifying Ring Partition Power +============================== + +The ring partition power determines the on-disk location of data files and is +selected when creating a new ring. In normal operation, it is a fixed value. +This is because a different partition power results in a different on-disk +location for all data files. + +However, increasing the partition power by 1 can be done by choosing locations +that are on the same disk. As a result, we can create hard-links for both the +new and old locations, avoiding data movement without impacting availability. + +To enable a partition power change without interrupting user access, object +servers need to be aware of it in advance. Therefore a partition power change +needs to be done in multiple steps. + +.. note:: + + Do not increase the partition power on account and container rings. + Increasing the partition power is *only* supported for object rings. + Trying to increase the part_power for account and container rings *will* + result in unavailability, maybe even data loss. + + +------- +Caveats +------- + +Before increasing the partition power, consider the possible drawbacks. +There are a few caveats when increasing the partition power: + +* Almost all diskfiles in the cluster need to be relinked then cleaned up, + and all partition directories need to be rehashed. This imposes significant + I/O load on object servers, which may impact client requests. Consider using + cgroups, ``ionice``, or even just the built-in ``--files-per-second`` + rate-limiting to reduce client impact. 
+* Object replicators and reconstructors will skip affected policies during the + partition power increase. Replicators are not aware of hard-links, and would + simply copy the content; this would result in heavy data movement and the + worst case would be that all data is stored twice. +* Due to the fact that each object will now be hard linked from two locations, + many more inodes will be used temporarily - expect around twice the amount. + You need to check the free inode count *before* increasing the partition + power. Even after the increase is complete and extra hardlinks are cleaned + up, expect increased inode usage since there will be twice as many partition + and suffix directories. +* Also, object auditors might read each object twice before cleanup removes the + second hard link. +* Due to the new inodes more memory is needed to cache them, and your + object servers should have plenty of available memory to avoid running out of + inode cache. Setting ``vfs_cache_pressure`` to 1 might help with that. +* All nodes in the cluster *must* run at least Swift version 2.13.0 or later. + +Due to these caveats you should only increase the partition power if really +needed, i.e. if the number of partitions per disk is extremely low and the data +is distributed unevenly across disks. + +----------------------------------- +1. Prepare partition power increase +----------------------------------- + +The swift-ring-builder is used to prepare the ring for an upcoming partition +power increase. It will store a new variable ``next_part_power`` with the current +partition power + 1. Object servers recognize this, and hard links to the new +location will be created (or deleted) on every PUT or DELETE. This will make +it possible to access newly written objects using the future partition power:: + + swift-ring-builder prepare_increase_partition_power + swift-ring-builder write_ring + +Now you need to copy the updated .ring.gz to all nodes. Already existing data +needs to be relinked too; therefore an operator has to run a relinker command +on all object servers in this phase:: + + swift-object-relinker relink + +.. note:: + + Start relinking after *all* the servers re-read the modified ring files, + which normally happens within 15 seconds after writing a modified ring. + Also, make sure the modified rings are pushed to all nodes running object + services (replicators, reconstructors and reconcilers)- they have to skip + the policy during relinking. + +.. note:: + + The relinking command must run as the same user as the daemon processes + (usually swift). It will create files and directories that must be + manipulable by the daemon processes (server, auditor, replicator, ...). + If necessary, the ``--user`` option may be used to drop privileges. + +Relinking might take some time; while there is no data copied or actually +moved, the tool still needs to walk the whole file system and create new hard +links as required. + +--------------------------- +2. Increase partition power +--------------------------- + +Now that all existing data can be found using the new location, it's time to +actually increase the partition power itself:: + + swift-ring-builder increase_partition_power + swift-ring-builder write_ring + +Now you need to copy the updated .ring.gz again to all nodes. Object servers +are now using the new, increased partition power and no longer create +additional hard links. + + +.. 
note:: + + The object servers will create additional hard links for each modified or + new object, and this requires more inodes. + +.. note:: + + If you decide you don't want to increase the partition power, you should + instead cancel the increase. It is not possible to revert this operation + once started. To abort the partition power increase, execute the following + commands, copy the updated .ring.gz files to all nodes and continue with + `3. Cleanup`_ afterwards:: + + swift-ring-builder cancel_increase_partition_power + swift-ring-builder write_ring + + +---------- +3. Cleanup +---------- + +Existing hard links in the old locations need to be removed, and a cleanup tool +is provided to do this. Run the following command on each storage node:: + + swift-object-relinker cleanup + +.. note:: + + The cleanup must be finished within your object servers ``reclaim_age`` + period (which is by default 1 week). Otherwise objects that have been + overwritten between step #1 and step #2 and deleted afterwards can't be + cleaned up anymore. You may want to increase your ``reclaim_age`` before + or during relinking. + +Afterwards it is required to update the rings one last +time to inform servers that all steps to increase the partition power are done, +and replicators should resume their job:: + + swift-ring-builder finish_increase_partition_power + swift-ring-builder write_ring + +Now you need to copy the updated .ring.gz again to all nodes. + +---------- +Background +---------- + +An existing object that is currently located on partition X will be placed +either on partition 2*X or 2*X+1 after the partition power is increased. The +reason for this is the Ring.get_part() method, that does a bitwise shift to the +right. + +To avoid actual data movement to different disks or even nodes, the allocation +of partitions to nodes needs to be changed. The allocation is pairwise due to +the above mentioned new partition scheme. Therefore devices are allocated like +this, with the partition being the index and the value being the device id:: + + old new + part dev part dev + ---- --- ---- --- + 0 0 0 0 + 1 0 + 1 3 2 3 + 3 3 + 2 7 4 7 + 5 7 + 3 5 6 5 + 7 5 + 4 2 8 2 + 9 2 + 5 1 10 1 + 11 1 + +There is a helper method to compute the new path, and the following example +shows the mapping between old and new location:: + + >>> from swift.common.utils import replace_partition_in_path + >>> old='objects/16003/a38/fa0fcec07328d068e24ccbf2a62f2a38/1467658208.57179.data' + >>> replace_partition_in_path('', '/sda/' + old, 14) + 'objects/16003/a38/fa0fcec07328d068e24ccbf2a62f2a38/1467658208.57179.data' + >>> replace_partition_in_path('', '/sda/' + old, 15) + 'objects/32007/a38/fa0fcec07328d068e24ccbf2a62f2a38/1467658208.57179.data' + +Using the original partition power (14) it returned the same path; however +after an increase to 15 it returns the new path, and the new partition is 2*X+1 +in this case. diff --git a/doc/source/s3_compat.rst b/doc/source/s3_compat.rst new file mode 100644 index 0000000000..04010a7c17 --- /dev/null +++ b/doc/source/s3_compat.rst @@ -0,0 +1,145 @@ +S3/Swift REST API Comparison Matrix +=================================== + +General compatibility statement +------------------------------- + +S3 is a product from Amazon, and as such, it includes "features" that +are outside the scope of Swift itself. For example, Swift doesn't +have anything to do with billing, whereas S3 buckets can be tied to +Amazon's billing system. Similarly, log delivery is a service outside +of Swift. 
It's entirely possible for a Swift deployment to provide that +functionality, but it is not part of Swift itself. Likewise, a Swift +deployment can provide similar geographic availability as S3, but this +is tied to the deployer's willingness to build the infrastructure and +support systems to do so. + +Amazon S3 operations +--------------------- + ++------------------------------------------------+------------------+--------------+ +| S3 REST API method | Category | Swift S3 API | ++================================================+==================+==============+ +| `GET Object`_ | Core-API | Yes | ++------------------------------------------------+------------------+--------------+ +| `HEAD Object`_ | Core-API | Yes | ++------------------------------------------------+------------------+--------------+ +| `PUT Object`_ | Core-API | Yes | ++------------------------------------------------+------------------+--------------+ +| `PUT Object Copy`_ | Core-API | Yes | ++------------------------------------------------+------------------+--------------+ +| `DELETE Object`_ | Core-API | Yes | ++------------------------------------------------+------------------+--------------+ +| `Initiate Multipart Upload`_ | Core-API | Yes | ++------------------------------------------------+------------------+--------------+ +| `Upload Part`_ | Core-API | Yes | ++------------------------------------------------+------------------+--------------+ +| `Upload Part Copy`_ | Core-API | Yes | ++------------------------------------------------+------------------+--------------+ +| `Complete Multipart Upload`_ | Core-API | Yes | ++------------------------------------------------+------------------+--------------+ +| `Abort Multipart Upload`_ | Core-API | Yes | ++------------------------------------------------+------------------+--------------+ +| `List Parts`_ | Core-API | Yes | ++------------------------------------------------+------------------+--------------+ +| `GET Object ACL`_ | Core-API | Yes | ++------------------------------------------------+------------------+--------------+ +| `PUT Object ACL`_ | Core-API | Yes | ++------------------------------------------------+------------------+--------------+ +| `PUT Bucket`_ | Core-API | Yes | ++------------------------------------------------+------------------+--------------+ +| `GET Bucket List Objects`_ | Core-API | Yes | ++------------------------------------------------+------------------+--------------+ +| `HEAD Bucket`_ | Core-API | Yes | ++------------------------------------------------+------------------+--------------+ +| `DELETE Bucket`_ | Core-API | Yes | ++------------------------------------------------+------------------+--------------+ +| `List Multipart Uploads`_ | Core-API | Yes | ++------------------------------------------------+------------------+--------------+ +| `GET Bucket acl`_ | Core-API | Yes | ++------------------------------------------------+------------------+--------------+ +| `PUT Bucket acl`_ | Core-API | Yes | ++------------------------------------------------+------------------+--------------+ +| `Versioning`_ | Versioning | Yes | ++------------------------------------------------+------------------+--------------+ +| `Bucket notification`_ | Notifications | No | ++------------------------------------------------+------------------+--------------+ +| Bucket Lifecycle [1]_ [2]_ [3]_ [4]_ [5]_ [6]_ | Bucket Lifecycle | No | ++------------------------------------------------+------------------+--------------+ +| `Bucket 
policy`_ | Advanced ACLs | No | ++------------------------------------------------+------------------+--------------+ +| Public website [7]_ [8]_ [9]_ [10]_ | Public Website | No | ++------------------------------------------------+------------------+--------------+ +| Billing [11]_ [12]_ | Billing | No | ++------------------------------------------------+------------------+--------------+ +| `GET Bucket location`_ | Advanced Feature | Yes | ++------------------------------------------------+------------------+--------------+ +| `Delete Multiple Objects`_ | Advanced Feature | Yes | ++------------------------------------------------+------------------+--------------+ +| `Object tagging`_ | Advanced Feature | No | ++------------------------------------------------+------------------+--------------+ +| `GET Object torrent`_ | Advanced Feature | No | ++------------------------------------------------+------------------+--------------+ +| `Bucket inventory`_ | Advanced Feature | No | ++------------------------------------------------+------------------+--------------+ +| `GET Bucket service`_ | Advanced Feature | No | ++------------------------------------------------+------------------+--------------+ +| `Bucket accelerate`_ | CDN Integration | No | ++------------------------------------------------+------------------+--------------+ + +---- + +.. _GET Object: http://docs.amazonwebservices.com/AmazonS3/latest/API/RESTObjectGET.html +.. _HEAD Object: http://docs.amazonwebservices.com/AmazonS3/latest/API/RESTObjectHEAD.html +.. _PUT Object: http://docs.amazonwebservices.com/AmazonS3/latest/API/RESTObjectPUT.html +.. _PUT Object Copy: http://docs.amazonwebservices.com/AmazonS3/latest/API/RESTObjectCOPY.html +.. _DELETE Object: http://docs.amazonwebservices.com/AmazonS3/latest/API/RESTObjectDELETE.html +.. _Initiate Multipart Upload: http://docs.amazonwebservices.com/AmazonS3/latest/API/mpUploadInitiate.html +.. _Upload Part: http://docs.amazonwebservices.com/AmazonS3/latest/API/mpUploadUploadPart.html +.. _Upload Part Copy: http://docs.amazonwebservices.com/AmazonS3/latest/API/mpUploadUploadPartCopy.html +.. _Complete Multipart Upload: http://docs.amazonwebservices.com/AmazonS3/latest/API/mpUploadComplete.html +.. _Abort Multipart Upload: http://docs.amazonwebservices.com/AmazonS3/latest/API/mpUploadAbort.html +.. _List Parts: http://docs.amazonwebservices.com/AmazonS3/latest/API/mpUploadListParts.html +.. _GET Object ACL: http://docs.amazonwebservices.com/AmazonS3/latest/API/RESTObjectGETacl.html +.. _PUT Object ACL: http://docs.amazonwebservices.com/AmazonS3/latest/API/RESTObjectPUTacl.html +.. _Delete Multiple Objects: http://docs.amazonwebservices.com/AmazonS3/latest/API/multiobjectdeleteapi.html +.. _GET Object torrent: http://docs.amazonwebservices.com/AmazonS3/latest/API/RESTObjectGETtorrent.html +.. _Object tagging: http://docs.aws.amazon.com/AmazonS3/latest/API/RESTObjectGETtagging.html + +.. _PUT Bucket: http://docs.amazonwebservices.com/AmazonS3/latest/API/RESTBucketPUT.html +.. _GET Bucket List Objects: http://docs.amazonwebservices.com/AmazonS3/latest/API/RESTBucketGET.html +.. _HEAD Bucket: http://docs.amazonwebservices.com/AmazonS3/latest/API/RESTBucketHEAD.html +.. _DELETE Bucket: http://docs.amazonwebservices.com/AmazonS3/latest/API/RESTBucketDELETE.html +.. _List Multipart Uploads: http://docs.amazonwebservices.com/AmazonS3/latest/API/mpUploadListMPUpload.html +.. _GET Bucket acl: http://docs.amazonwebservices.com/AmazonS3/latest/API/RESTBucketGETacl.html +.. 
_PUT Bucket acl: http://docs.amazonwebservices.com/AmazonS3/latest/API/RESTBucketPUTacl.html +.. _Bucket notification: http://docs.amazonwebservices.com/AmazonS3/latest/API/RESTBucketGETnotification.html +.. _Bucket policy: http://docs.amazonwebservices.com/AmazonS3/latest/API/RESTBucketGETpolicy.html +.. _GET Bucket location: http://docs.amazonwebservices.com/AmazonS3/latest/API/RESTBucketGETlocation.html +.. _Bucket accelerate: http://docs.aws.amazon.com/AmazonS3/latest/API/RESTBucketGETaccelerate.html +.. _Bucket inventory: http://docs.aws.amazon.com/AmazonS3/latest/API/RESTBucketGETInventoryConfig.html +.. _GET Bucket service: http://docs.aws.amazon.com/AmazonS3/latest/API/RESTServiceGET.html + +.. Versioning +.. _Versioning: http://docs.amazonwebservices.com/AmazonS3/latest/API/RESTBucketGETversioningStatus.html + + +.. Lifecycle +.. [1] `POST restore `_ +.. [2] `Bucket lifecycle `_ +.. [3] `Bucket logging `_ +.. [4] `Bucket analytics `_ +.. [5] `Bucket metrics `_ +.. [6] `Bucket replication `_ + + +.. Public website +.. [7] `OPTIONS object `_ +.. [8] `Object POST from HTML form `_ +.. [9] `Bucket public website `_ +.. [10] `Bucket CORS `_ + + +.. Billing +.. [11] `Request payment `_ +.. [12] `Bucket tagging `_ diff --git a/doc/source/test-cors.html b/doc/source/test-cors.html new file mode 100644 index 0000000000..b8a28a195f --- /dev/null +++ b/doc/source/test-cors.html @@ -0,0 +1,60 @@ + + + + + Test CORS + + + + Token


+ Method
+ URL (Container or Object)
diff --git a/docker/dockerhub_description.md b/docker/dockerhub_description.md
new file mode 100644
index 0000000000..d5a3739f58
--- /dev/null
+++ b/docker/dockerhub_description.md
@@ -0,0 +1,50 @@
+# SAIO (Swift All in One)
+
+SAIO is a containerized instance of OpenStack Swift object storage. It runs
+the main Swift services and is designed to give application developers an
+endpoint to test against, using either the Swift API or the AWS S3 API. It can
+also be used when integrating with a CI/CD system. These images are not
+configured to provide data durability and are not intended for production use.
+
+
+# Quickstart
+
+```
+docker pull openstackswift/saio
+docker run -d -p 8080:8080 openstackswift/saio
+```
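+
+Once the container is up (it builds its rings at startup, so give it a few
+seconds), you can verify the proxy is answering. Below is a minimal sketch
+using only the Python standard library; it assumes the default SAIO pipeline,
+which exposes the `healthcheck` and `/info` endpoints:
+
+```python
+from urllib.request import urlopen
+
+# The healthcheck middleware returns a bare "OK" when the proxy is alive.
+print(urlopen('http://127.0.0.1:8080/healthcheck').read())
+
+# /info lists the cluster's advertised capabilities as JSON.
+print(urlopen('http://127.0.0.1:8080/info').read()[:200])
+```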
+
+### Test against Swift API:
+
+Example using the swift client to target the endpoint:
+```
+swift -A http://127.0.0.1:8080/auth/v1.0 -U test:tester -K testing stat
+```
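+
+The same check can be scripted with `python-swiftclient` (a sketch; assumes
+`pip install python-swiftclient` and the default SAIO credentials shown above):
+
+```python
+from swiftclient.client import Connection
+
+conn = Connection(authurl='http://127.0.0.1:8080/auth/v1.0',
+                  user='test:tester', key='testing')
+
+# head_account() returns the account headers, e.g. container/object counts.
+print(conn.head_account())
+```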
+
+### Test against S3 API:
+
+Example using s3cmd to test the S3 API:
+
+1. Create a config file (e.g. `s3cfg_saio`, matching the `-c` option below):
+```
+[default]
+access_key = test:tester
+secret_key = testing
+host_base = localhost:8080
+host_bucket = localhost:8080
+use_https = False
+```
+
+2. Test with s3cmd:
+```
+s3cmd -c s3cfg_saio mb s3://bucket
+```
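+
+If you would rather script against the S3 API, the same endpoint can be
+exercised with `boto3` (a sketch; assumes `pip install boto3` and the
+credentials from the config above):
+
+```python
+import boto3
+
+s3 = boto3.client('s3',
+                  endpoint_url='http://localhost:8080',
+                  aws_access_key_id='test:tester',
+                  aws_secret_access_key='testing')
+
+s3.create_bucket(Bucket='bucket')    # equivalent of: s3cmd mb s3://bucket
+print(s3.list_buckets()['Buckets'])  # confirm the bucket exists
+```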
+
+# Quick Reference
+
+- **Image tags**: `latest` is automatically built and published by Zuul and
+   follows the master branch. Releases are also tagged in case you want to
+   test against a specific release.
+- **Source Code**: github.com/openstack/swift
+- **Maintained by**: OpenStack Swift community
+- **Feedback/Questions**: #openstack-swift on OFTC
diff --git a/docker/install_scripts/00_swift_needs.sh b/docker/install_scripts/00_swift_needs.sh
new file mode 100755
index 0000000000..b83621d7b0
--- /dev/null
+++ b/docker/install_scripts/00_swift_needs.sh
@@ -0,0 +1,22 @@
+#!/bin/sh
+set -e
+
+# adduser -D -H syslog && \
+for user in "swift"; do
+  if ! id -u $user > /dev/null 2>&1 ; then
+    adduser -D $user
+    printf "created user $user\n"
+  fi
+done
+printf "\n"
+# mkdir /srv/node && \
+# mkdir /var/spool/rsyslog && \
+# chown -R swift:swift /srv/node/ && \
+for dirname in "/srv/node" "$HOME/bin" "/opt" "/var/cache/swift" "/var/log/socklog/swift" "/var/log/swift/" "/var/run/swift"; do
+  if [ ! -d $dirname ]; then
+    mkdir -p $dirname
+    printf "created $dirname\n"
+  fi
+done
+# mkdir -p $HOME/bin && \
+# mkdir -p /opt
diff --git a/docker/install_scripts/10_apk_install_prereqs.sh b/docker/install_scripts/10_apk_install_prereqs.sh
new file mode 100755
index 0000000000..f021b4c113
--- /dev/null
+++ b/docker/install_scripts/10_apk_install_prereqs.sh
@@ -0,0 +1,27 @@
+#!/bin/sh
+set -e
+
+echo "@testing http://dl-cdn.alpinelinux.org/alpine/edge/testing" >> /etc/apk/repositories
+apk add --update \
+  linux-headers \
+  liberasurecode@testing \
+  liberasurecode-dev@testing \
+  gnupg \
+  git \
+  curl \
+  rsync \
+  memcached \
+  openssl \
+  openssl-dev \
+  sqlite \
+  sqlite-libs \
+  sqlite-dev \
+  xfsprogs \
+  zlib-dev \
+  g++ \
+  libffi \
+  libffi-dev \
+  libxslt \
+  libxslt-dev \
+  libxml2 \
+  libxml2-dev
diff --git a/docker/install_scripts/21_apk_install_py3.sh b/docker/install_scripts/21_apk_install_py3.sh
new file mode 100755
index 0000000000..0bc647d513
--- /dev/null
+++ b/docker/install_scripts/21_apk_install_py3.sh
@@ -0,0 +1,12 @@
+#!/bin/sh
+set -e
+
+apk add --update \
+  python3 \
+  python3-dev \
+  py3-pip \
+  py3-cffi \
+  py3-cryptography
+
+if [ ! -e /usr/bin/pip ]; then ln -s pip3 /usr/bin/pip ; fi
+
diff --git a/docker/install_scripts/50_swift_install.sh b/docker/install_scripts/50_swift_install.sh
new file mode 100755
index 0000000000..953d75d541
--- /dev/null
+++ b/docker/install_scripts/50_swift_install.sh
@@ -0,0 +1,18 @@
+#!/bin/sh
+set -e
+
+pip install -U pip
+cd /opt/swift
+pip install -r requirements.txt
+pip install -e .
+
+cp doc/saio/bin/* $HOME/bin
+chmod +x $HOME/bin/*
+# The SAIO helper scripts assume bash and sudo; rewrite them to run under the
+# container's plain sh as root.
+sed -i "s/bash/sh/g" $HOME/bin/*
+sed -i "s/sudo //g" $HOME/bin/*
+mkdir /root/tmp
+echo "export PATH=${PATH}:$HOME/bin" >> $HOME/.shrc
+echo "export PYTHON_EGG_CACHE=/root/tmp" >> $HOME/.shrc
+echo "export ENV=$HOME/.shrc" >> $HOME/.profile
+chmod +x $HOME/.shrc
+chmod +x $HOME/.profile
diff --git a/docker/install_scripts/60_pip_uninstall_dev.sh b/docker/install_scripts/60_pip_uninstall_dev.sh
new file mode 100755
index 0000000000..655aba5ccc
--- /dev/null
+++ b/docker/install_scripts/60_pip_uninstall_dev.sh
@@ -0,0 +1,9 @@
+#!/bin/sh
+set -e
+
+echo "- - - - - - - - uninstalling simplejson"
+pip uninstall --yes simplejson
+echo "- - - - - - - - uninstalling pyopenssl"
+pip uninstall --yes pyopenssl
+echo "- - - - - - - - deleting python3-dev residue (config-3.6m-x86_64-linux-gnu)"
+rm -rf /opt/usr/local/lib/python3.6/config-3.6m-x86_64-linux-gnu/
diff --git a/docker/install_scripts/99_apk_uninstall_dev.sh b/docker/install_scripts/99_apk_uninstall_dev.sh
new file mode 100755
index 0000000000..c4692ff3b4
--- /dev/null
+++ b/docker/install_scripts/99_apk_uninstall_dev.sh
@@ -0,0 +1,17 @@
+#!/bin/sh
+set -e
+
+cd /
+rm -rf /build
+
+apk del gnupg
+apk del git
+apk del openssl-dev
+apk del sqlite-dev
+apk del zlib-dev
+apk del g++
+apk del libffi-dev
+apk del libxslt-dev
+apk del libxml2-dev
+apk del python3-dev
+rm -rf /var/cache/apk/*
diff --git a/docker/install_scripts/python_test_dirs b/docker/install_scripts/python_test_dirs
new file mode 100644
index 0000000000..382d99284e
--- /dev/null
+++ b/docker/install_scripts/python_test_dirs
@@ -0,0 +1,7 @@
+/opt/python/usr/local/lib/python3.6/ctypes/test
+/opt/python/usr/local/lib/python3.6/distutils/tests
+/opt/python/usr/local/lib/python3.6/idlelib/idle_test
+/opt/python/usr/local/lib/python3.6/lib2to3/tests
+/opt/python/usr/local/lib/python3.6/sqlite3/test
+/opt/python/usr/local/lib/python3.6/test
+/opt/python/usr/local/lib/python3.6/tkinter/test
diff --git a/docker/rootfs/etc/cont-init.d/01_swift_logs b/docker/rootfs/etc/cont-init.d/01_swift_logs
new file mode 100644
index 0000000000..fcc3e4c6a8
--- /dev/null
+++ b/docker/rootfs/etc/cont-init.d/01_swift_logs
@@ -0,0 +1,4 @@
+#!/bin/sh
+
+s6-setuidgid swift ln -s /var/log/socklog/swift/swift_all/current /var/log/swift/all.log
+s6-setuidgid swift ln -s /var/log/socklog/swift/proxy_server/current /var/log/swift/proxy_access.log
diff --git a/docker/rootfs/etc/cont-init.d/02_build_remakerings b/docker/rootfs/etc/cont-init.d/02_build_remakerings
new file mode 100644
index 0000000000..e49d4a911a
--- /dev/null
+++ b/docker/rootfs/etc/cont-init.d/02_build_remakerings
@@ -0,0 +1,3 @@
+#!/usr/bin/with-contenv sh
+
+exec s6-setuidgid swift /etc/swift_build/prepare_rings
diff --git a/docker/rootfs/etc/fix-attrs.d/logging b/docker/rootfs/etc/fix-attrs.d/logging
new file mode 100644
index 0000000000..a8de639776
--- /dev/null
+++ b/docker/rootfs/etc/fix-attrs.d/logging
@@ -0,0 +1,2 @@
+/var/log/swift true swift 0755 0755
+/var/spool/rsyslog true syslog 0700 0700
diff --git a/docker/rootfs/etc/fix-attrs.d/srv_node b/docker/rootfs/etc/fix-attrs.d/srv_node
new file mode 100644
index 0000000000..adee7ec5e8
--- /dev/null
+++ b/docker/rootfs/etc/fix-attrs.d/srv_node
@@ -0,0 +1 @@
+/srv/node true swift 0700 0700
diff --git a/docker/rootfs/etc/fix-attrs.d/swift b/docker/rootfs/etc/fix-attrs.d/swift
new file mode 100644
index 0000000000..bf368314aa
--- /dev/null
+++ b/docker/rootfs/etc/fix-attrs.d/swift
@@ -0,0 +1,4 @@
+/etc/swift true swift 0700 0700
+/etc/swift/mime.types true swift 0700 0700
+/var/run/swift true swift 0755 0755
+/var/cache/swift true swift 0755 0755
diff --git a/docker/rootfs/etc/fix-attrs.d/tmp b/docker/rootfs/etc/fix-attrs.d/tmp
new file mode 100644
index 0000000000..8a6d27a5c0
--- /dev/null
+++ b/docker/rootfs/etc/fix-attrs.d/tmp
@@ -0,0 +1 @@
+/tmp true root 0700 0700
diff --git a/docker/rootfs/etc/profile b/docker/rootfs/etc/profile
new file mode 100644
index 0000000000..9ad1060e20
--- /dev/null
+++ b/docker/rootfs/etc/profile
@@ -0,0 +1,11 @@
+export CHARSET=UTF-8
+export PATH=/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/opt/python/usr/local/bin
+export PAGER=less
+export PS1='\h:\w\$ '
+umask 022
+
+for script in /etc/profile.d/*.sh ; do
+        if [ -r $script ] ; then
+                . $script
+        fi
+done
diff --git a/docker/rootfs/etc/rsyncd.conf b/docker/rootfs/etc/rsyncd.conf
new file mode 100644
index 0000000000..2d4a1fb35d
--- /dev/null
+++ b/docker/rootfs/etc/rsyncd.conf
@@ -0,0 +1,23 @@
+uid = swift
+gid = swift
+log file = /var/log/rsyncd.log
+pid file = /var/run/rsyncd.pid
+address = 127.0.0.1
+
+[account]
+max connections = 2
+path = /srv/node/
+read only = false
+lock file = /var/lock/account.lock
+
+[container]
+max connections = 2
+path = /srv/node/
+read only = false
+lock file = /var/lock/container.lock
+
+[object]
+max connections = 2
+path = /srv/node/
+read only = false
+lock file = /var/lock/object.lock
diff --git a/docker/rootfs/etc/rsyslog.conf b/docker/rootfs/etc/rsyslog.conf
new file mode 100644
index 0000000000..fa42783dab
--- /dev/null
+++ b/docker/rootfs/etc/rsyslog.conf
@@ -0,0 +1,64 @@
+#  /etc/rsyslog.conf	Configuration file for rsyslog.
+#
+#			For more information see
+#			/usr/share/doc/rsyslog-doc/html/rsyslog_conf.html
+#
+#  Default logging rules can be found in /etc/rsyslog.d/50-default.conf
+
+
+#################
+#### MODULES ####
+#################
+
+$ModLoad imuxsock # provides support for local system logging
+#$ModLoad imklog   # provides kernel logging support
+#$ModLoad immark  # provides --MARK-- message capability
+
+# provides UDP syslog reception
+#$ModLoad imudp
+#$UDPServerRun 514
+
+# provides TCP syslog reception
+#$ModLoad imtcp
+#$InputTCPServerRun 514
+
+# Enable non-kernel facility klog messages
+$KLogPermitNonKernelFacility on
+
+###########################
+#### GLOBAL DIRECTIVES ####
+###########################
+
+#
+# Use traditional timestamp format.
+# To enable high precision timestamps, comment out the following line.
+#
+$ActionFileDefaultTemplate RSYSLOG_TraditionalFileFormat
+
+# Filter duplicated messages
+$RepeatedMsgReduction on
+
+# Disable rate-limiting of log entries
+$SystemLogRateLimitInterval 0
+$SystemLogRateLimitBurst 0
+
+#
+# Set the default permissions for all log files.
+#
+$FileOwner syslog
+$FileGroup adm
+$FileCreateMode 0640
+$DirCreateMode 0755
+$Umask 0022
+$PrivDropToUser syslog
+$PrivDropToGroup syslog
+
+#
+# Where to place spool and state files
+#
+$WorkDirectory /var/spool/rsyslog
+
+#
+# Include all config files in /etc/rsyslog.d/
+#
+$IncludeConfig /etc/rsyslog.d/*.conf
diff --git a/docker/rootfs/etc/rsyslog.d/00-swift.conf b/docker/rootfs/etc/rsyslog.d/00-swift.conf
new file mode 100644
index 0000000000..00adb57258
--- /dev/null
+++ b/docker/rootfs/etc/rsyslog.d/00-swift.conf
@@ -0,0 +1,16 @@
+# NOTE: we used to enable UDP logging here, but we switched
+# back to just unix domain socket.
+
+#$imjournalRatelimitInterval 60
+#$imjournalRatelimitBurst 600000
+
+# *.*                         @127.0.0.1:514
+
+# Log all Swift proxy-server access log lines (local2) to
+# /var/log/swift/proxy_access.log
+local2.* /var/log/swift/proxy_access.log;RSYSLOG_FileFormat
+
+# Log all Swift lines to /var/log/swift/all.log
+# AND PREVENT FURTHER LOGGING OF THEM (eg. to /var/log/syslog)
+local0.*;local2.* /var/log/swift/all.log;RSYSLOG_TraditionalFileFormat
+& ~
diff --git a/docker/rootfs/etc/rsyslog.d/50-default.conf b/docker/rootfs/etc/rsyslog.d/50-default.conf
new file mode 100644
index 0000000000..d8283d485d
--- /dev/null
+++ b/docker/rootfs/etc/rsyslog.d/50-default.conf
@@ -0,0 +1,68 @@
+#  Default rules for rsyslog.
+#
+#			For more information see rsyslog.conf(5) and /etc/rsyslog.conf
+
+#
+# First some standard log files.  Log by facility.
+#
+auth,authpriv.*			/var/log/auth.log
+*.*;auth,authpriv.none		-/var/log/syslog
+#cron.*				/var/log/cron.log
+#daemon.*			-/var/log/daemon.log
+#kern.*				-/var/log/kern.log
+#lpr.*				-/var/log/lpr.log
+#mail.*				-/var/log/mail.log
+#user.*				-/var/log/user.log
+
+#
+# Logging for the mail system.  Split it up so that
+# it is easy to write scripts to parse these files.
+#
+#mail.info			-/var/log/mail.info
+#mail.warn			-/var/log/mail.warn
+mail.err			/var/log/mail.err
+
+#
+# Logging for INN news system.
+#
+news.crit			/var/log/news/news.crit
+news.err			/var/log/news/news.err
+news.notice			-/var/log/news/news.notice
+
+#
+# Some "catch-all" log files.
+#
+#*.=debug;\
+#	auth,authpriv.none;\
+#	news.none;mail.none	-/var/log/debug
+#*.=info;*.=notice;*.=warn;\
+#	auth,authpriv.none;\
+#	cron,daemon.none;\
+#	mail,news.none		-/var/log/messages
+
+#
+# Emergencies are sent to everybody logged in.
+#
+*.emerg                                :omusrmsg:*
+
+#
+# I like to have messages displayed on the console, but only on a virtual
+# console I usually leave idle.
+#
+#daemon,mail.*;\
+#	news.=crit;news.=err;news.=notice;\
+#	*.=debug;*.=info;\
+#	*.=notice;*.=warn	/dev/tty8
+
+# The named pipe /dev/xconsole is for the `xconsole' utility.  To use it,
+# you must invoke `xconsole' with the `-file' option:
+#
+#    $ xconsole -file /dev/xconsole [...]
+#
+# NOTE: adjust the list below, or you'll go crazy if you have a reasonably
+#      busy site..
+#
+daemon.*;mail.*;\
+	news.err;\
+	*.=debug;*.=info;\
+	*.=notice;*.=warn	|/dev/xconsole
diff --git a/docker/rootfs/etc/services.d/memcached/run b/docker/rootfs/etc/services.d/memcached/run
new file mode 100644
index 0000000000..a6d5f994d6
--- /dev/null
+++ b/docker/rootfs/etc/services.d/memcached/run
@@ -0,0 +1,3 @@
+#!/usr/bin/execlineb -P
+
+memcached -u root -l 127.0.0.1
diff --git a/docker/rootfs/etc/services.d/swift-account/run b/docker/rootfs/etc/services.d/swift-account/run
new file mode 100644
index 0000000000..f310983146
--- /dev/null
+++ b/docker/rootfs/etc/services.d/swift-account/run
@@ -0,0 +1,5 @@
+#!/bin/sh
+source /etc/profile
+
+# swift-account-server /etc/swift/account-server.conf
+exec s6-setuidgid swift swift-init account restart --no-daemon
diff --git a/docker/rootfs/etc/services.d/swift-container/run b/docker/rootfs/etc/services.d/swift-container/run
new file mode 100644
index 0000000000..0ed34dad05
--- /dev/null
+++ b/docker/rootfs/etc/services.d/swift-container/run
@@ -0,0 +1,5 @@
+#!/bin/sh
+source /etc/profile
+
+# swift-container-server /etc/swift/container-server.conf
+exec s6-setuidgid swift swift-init container restart --no-daemon
diff --git a/docker/rootfs/etc/services.d/swift-object/run b/docker/rootfs/etc/services.d/swift-object/run
new file mode 100644
index 0000000000..80f8c8d618
--- /dev/null
+++ b/docker/rootfs/etc/services.d/swift-object/run
@@ -0,0 +1,4 @@
+#!/bin/sh
+source /etc/profile
+
+exec s6-setuidgid swift swift-init object restart --no-daemon
diff --git a/docker/rootfs/etc/services.d/swift-proxy/run b/docker/rootfs/etc/services.d/swift-proxy/run
new file mode 100644
index 0000000000..be73b5398d
--- /dev/null
+++ b/docker/rootfs/etc/services.d/swift-proxy/run
@@ -0,0 +1,5 @@
+#!/bin/sh
+source /etc/profile
+
+# swift-proxy-server /etc/swift/proxy-server.conf
+exec s6-setuidgid swift swift-init proxy restart --no-daemon
diff --git a/docker/rootfs/etc/socklog.rules/swift_account_server b/docker/rootfs/etc/socklog.rules/swift_account_server
new file mode 100644
index 0000000000..7a8ddb8ea0
--- /dev/null
+++ b/docker/rootfs/etc/socklog.rules/swift_account_server
@@ -0,0 +1,3 @@
+-
++\local5.*
+/var/log/socklog/swift/account_server
diff --git a/docker/rootfs/etc/socklog.rules/swift_all b/docker/rootfs/etc/socklog.rules/swift_all
new file mode 100644
index 0000000000..6ce9c899dc
--- /dev/null
+++ b/docker/rootfs/etc/socklog.rules/swift_all
@@ -0,0 +1,7 @@
+-
++\local5.*
++\local4.*
++\local3.*
++\local2.*
++\local0.*
+/var/log/socklog/swift/swift_all
diff --git a/docker/rootfs/etc/socklog.rules/swift_container_server b/docker/rootfs/etc/socklog.rules/swift_container_server
new file mode 100644
index 0000000000..428119e964
--- /dev/null
+++ b/docker/rootfs/etc/socklog.rules/swift_container_server
@@ -0,0 +1,3 @@
+-
++\local4.*
+/var/log/socklog/swift/container_server
diff --git a/docker/rootfs/etc/socklog.rules/swift_object_server b/docker/rootfs/etc/socklog.rules/swift_object_server
new file mode 100644
index 0000000000..e2e92fe9d2
--- /dev/null
+++ b/docker/rootfs/etc/socklog.rules/swift_object_server
@@ -0,0 +1,3 @@
+-
++\local3.*
+/var/log/socklog/swift/object_server
diff --git a/docker/rootfs/etc/socklog.rules/swift_proxy_server b/docker/rootfs/etc/socklog.rules/swift_proxy_server
new file mode 100644
index 0000000000..b743082168
--- /dev/null
+++ b/docker/rootfs/etc/socklog.rules/swift_proxy_server
@@ -0,0 +1,3 @@
+-
++\local2.*
+/var/log/socklog/swift/proxy_server
diff --git a/docker/rootfs/etc/swift/account-server.conf b/docker/rootfs/etc/swift/account-server.conf
new file mode 100644
index 0000000000..fd61d550ca
--- /dev/null
+++ b/docker/rootfs/etc/swift/account-server.conf
@@ -0,0 +1,25 @@
+[DEFAULT]
+devices = /srv/node/
+bind_ip = 127.0.0.1
+bind_port = 6202
+workers = 2
+mount_check = false
+log_facility = LOG_LOCAL5
+
+[pipeline:main]
+pipeline = healthcheck recon account-server
+
+[app:account-server]
+use = egg:swift#account
+
+[filter:recon]
+use = egg:swift#recon
+
+[filter:healthcheck]
+use = egg:swift#healthcheck
+
+[account-replicator]
+
+[account-auditor]
+
+[account-reaper]
diff --git a/docker/rootfs/etc/swift/container-server.conf b/docker/rootfs/etc/swift/container-server.conf
new file mode 100644
index 0000000000..aec046aafa
--- /dev/null
+++ b/docker/rootfs/etc/swift/container-server.conf
@@ -0,0 +1,27 @@
+[DEFAULT]
+devices = /srv/node/
+bind_ip = 127.0.0.1
+bind_port = 6201
+workers = 2
+mount_check = false
+log_facility = LOG_LOCAL4
+
+[pipeline:main]
+pipeline = healthcheck recon container-server
+
+[app:container-server]
+use = egg:swift#container
+
+[filter:recon]
+use = egg:swift#recon
+
+[filter:healthcheck]
+use = egg:swift#healthcheck
+
+[container-replicator]
+
+[container-updater]
+
+[container-auditor]
+
+[container-sync]
diff --git a/docker/rootfs/etc/swift/object-server.conf b/docker/rootfs/etc/swift/object-server.conf
new file mode 100644
index 0000000000..67bbf2cb37
--- /dev/null
+++ b/docker/rootfs/etc/swift/object-server.conf
@@ -0,0 +1,26 @@
+[DEFAULT]
+devices = /srv/node/
+bind_ip = 127.0.0.1
+bind_port = 6200
+workers = 2
+mount_check = false
+log_facility = LOG_LOCAL3
+
+[pipeline:main]
+pipeline = healthcheck recon object-server
+
+[app:object-server]
+use = egg:swift#object
+
+[filter:recon]
+use = egg:swift#recon
+
+[filter:healthcheck]
+use = egg:swift#healthcheck
+
+
+[object-replicator]
+
+[object-updater]
+
+[object-auditor]
diff --git a/docker/rootfs/etc/swift/proxy-server.conf b/docker/rootfs/etc/swift/proxy-server.conf
new file mode 100644
index 0000000000..8189cb7f2d
--- /dev/null
+++ b/docker/rootfs/etc/swift/proxy-server.conf
@@ -0,0 +1,100 @@
+[DEFAULT]
+bind_ip = 0.0.0.0
+bind_port = 8080
+log_address = /dev/log
+log_facility = LOG_LOCAL2
+log_headers = false
+log_level = DEBUG
+log_name = proxy-server
+user = swift
+
+[pipeline:main]
+pipeline = catch_errors gatekeeper healthcheck proxy-logging cache etag-quoter listing_formats bulk tempurl ratelimit s3api tempauth staticweb copy container-quotas account-quotas slo dlo versioned_writes symlink proxy-logging proxy-server
+
+[filter:catch_errors]
+use = egg:swift#catch_errors
+
+[filter:healthcheck]
+use = egg:swift#healthcheck
+
+[filter:proxy-logging]
+use = egg:swift#proxy_logging
+
+[filter:bulk]
+use = egg:swift#bulk
+
+[filter:ratelimit]
+use = egg:swift#ratelimit
+
+[filter:crossdomain]
+use = egg:swift#crossdomain
+
+[filter:dlo]
+use = egg:swift#dlo
+
+[filter:slo]
+use = egg:swift#slo
+
+[filter:tempurl]
+use = egg:swift#tempurl
+
+[filter:tempauth]
+use = egg:swift#tempauth
+user_admin_admin = admin .admin .reseller_admin
+user_test_tester = testing .admin
+user_test_tester2 = testing2 .admin
+user_test_tester3 = testing3
+user_test2_tester2 = testing2 .admin
+
+[filter:staticweb]
+use = egg:swift#staticweb
+
+[filter:account-quotas]
+use = egg:swift#account_quotas
+
+[filter:container-quotas]
+use = egg:swift#container_quotas
+
+[filter:cache]
+use = egg:swift#memcache
+
+[filter:etag-quoter]
+use = egg:swift#etag_quoter
+enable_by_default = false
+
+[filter:gatekeeper]
+use = egg:swift#gatekeeper
+
+[filter:versioned_writes]
+use = egg:swift#versioned_writes
+allow_versioned_writes = true
+allow_object_versioning = true
+
+[filter:copy]
+use = egg:swift#copy
+
+[filter:listing_formats]
+use = egg:swift#listing_formats
+
+[filter:symlink]
+use = egg:swift#symlink
+
+# To enable, add the s3api middleware to the pipeline before tempauth
+[filter:s3api]
+use = egg:swift#s3api
+cors_preflight_allow_origin = *
+
+# Example to create root secret: `openssl rand -base64 32`
+[filter:keymaster]
+use = egg:swift#keymaster
+encryption_root_secret = changeme/changeme/changeme/changeme/change/=
+
+# To enable use of encryption add both middlewares to pipeline, example:
+#  keymaster encryption proxy-logging proxy-server
+[filter:encryption]
+use = egg:swift#encryption
+
+[app:proxy-server]
+use = egg:swift#proxy
+allow_account_management = true
+account_autocreate = true
diff --git a/docker/rootfs/etc/swift/swift.conf b/docker/rootfs/etc/swift/swift.conf
new file mode 100644
index 0000000000..129a5d98a2
--- /dev/null
+++ b/docker/rootfs/etc/swift/swift.conf
@@ -0,0 +1,17 @@
+[swift-hash]
+# random unique strings that can never change (DO NOT LOSE)
+swift_hash_path_prefix = bd08f643f5663c4ec607
+swift_hash_path_suffix = f423bf7ab663888fe832
+
+[storage-policy:0]
+name = 1replica
+default = true
+policy_type = replication
+
+# [storage-policy:1]
+# name = EC42
+# policy_type = erasure_coding
+# ec_type = liberasurecode_rs_vand
+# ec_num_data_fragments = 4
+# ec_num_parity_fragments = 2
+# ec_object_segment_size = 1048576
diff --git a/docker/rootfs/etc/swift_build/build_devices b/docker/rootfs/etc/swift_build/build_devices
new file mode 100755
index 0000000000..7588377dd1
--- /dev/null
+++ b/docker/rootfs/etc/swift_build/build_devices
@@ -0,0 +1,62 @@
+#!/usr/bin/with-contenv sh
+
+cd /etc/swift
+DEV_SIZE="1GB"
+# POLICIES="object container account"
+MY_STORAGE_TYPE=${STORAGE_TYPE:-"internal_dirs"}
+MY_DEVICE_COUNT=${DEVICE_COUNT:-6}
+
+echo "[[ checking --privileged ]]"
+ip link add dummy0 type dummy >/dev/null
+if [[ $? -eq 0 ]]; then
+  PRIVILEGED=true
+  # clean the dummy0 link
+  ip link delete dummy0 >/dev/null
+else
+  PRIVILEGED=false
+fi
+
+echo "storage type is $MY_STORAGE_TYPE. container is privileged? $PRIVILEGED"
+
+echo "[[ checking what to use as storage devices ]]"
+DEVICE_LIST=""
+if [[ $MY_STORAGE_TYPE == "external_devices" ]]; then
+  DEVICE_LIST=$(ls /dev/ | grep -i "swift-d")
+  MY_DEVICE_COUNT=$(echo $DEVICE_LIST | wc -w)
+  echo "  using external devices. devices found: $DEVICE_LIST"
+elif [[ $MY_DEVICE_COUNT -le 0 ]]; then
+  echo "Device count must be greater than 0"
+  exit 1
+else
+  for i in $(seq 0 $(( MY_DEVICE_COUNT-1 ))); do
+    DEVICE_LIST="$DEVICE_LIST swift-d$i"
+  done
+  # echo "  using internal devices. devices to create: $DEVICE_LIST"
+fi
+
+if [[ $MY_STORAGE_TYPE == "internal_devices" ]]; then
+  for device in $DEVICE_LIST; do
+    truncate -s $DEV_SIZE /dev/$device;
+    echo "    created storage device /dev/$device of $DEV_SIZE";
+  done
+fi
+
+export PATH=$PATH:/opt/python/usr/local/bin/
+
+echo "[[ creating directories ]]"
+for dir in $DEVICE_LIST; do
+  mkdir -p /srv/node/$dir;
+  echo "  created /srv/node/$dir";
+done
+
+if [[ $MY_STORAGE_TYPE == "internal_devices" ]] || [[ $MY_STORAGE_TYPE == "external_devices" ]]; then
+  echo "[[ formatting and mounting storage devices ]]"
+  for device in $DEVICE_LIST; do
+    # truncate -s $DEV_SIZE /dev/swift-d$i;
+    # echo "created storage device /dev/swift-d$i of $DEV_SIZE";
+    mkfs.xfs -f -L "$device" -i size=512 /dev/$device;
+    echo "  created XFS file system on device /dev/$device";
+    mount -t xfs -o noatime /dev/$device /srv/node/$device;
+    echo "  mounted /dev/$device as /srv/node/$device";
+  done
+fi
diff --git a/docker/rootfs/etc/swift_build/build_remakerings b/docker/rootfs/etc/swift_build/build_remakerings
new file mode 100755
index 0000000000..08830d6491
--- /dev/null
+++ b/docker/rootfs/etc/swift_build/build_remakerings
@@ -0,0 +1,36 @@
+#!/usr/bin/with-contenv sh
+
+POLICIES="object container account"
+
+for p in $POLICIES; do
+  echo "swift-ring-builder $p.builder create 10 1 1" > /etc/swift/remakerings.$p;
+  echo "started /etc/swift/remakerings.$p with 'swift-ring-builder create'"
+done
+
+
+for drive in `ls /srv/node/ | grep 'swift-d'`; do
+  echo "swift-ring-builder object.builder add r1z1-127.0.0.1:6200/$drive 1" >> /etc/swift/remakerings.object
+  echo "pushed command to add r1z1-127.0.0.1:6200/$drive to /etc/swift/remakerings.object"
+  echo "swift-ring-builder container.builder add r1z1-127.0.0.1:6201/$drive 1" >> /etc/swift/remakerings.container
+  echo "pushed command to add r1z1-127.0.0.1:6201/$drive to /etc/swift/remakerings.container"
+  echo "swift-ring-builder account.builder add r1z1-127.0.0.1:6202/$drive 1" >> /etc/swift/remakerings.account
+  echo "pushed command to add r1z1-127.0.0.1:6202/$drive to /etc/swift/remakerings.account"
+done
+
+for p in $POLICIES; do
+  echo "swift-ring-builder $p.builder rebalance" >> /etc/swift/remakerings.$p;
+  echo "pushed command to rebalance ring into /etc/swift/remakerings.$p"
+done
+
+echo "rm -f *.builder *.ring.gz backups/*.builder backups/*.ring.gz" > /etc/swift/remakerings
+echo "created umbrella /etc/swift/remakerings, starting by deleting all ring files"
+
+for p in $POLICIES; do
+  cat /etc/swift/remakerings.$p >> /etc/swift/remakerings;
+  echo "pushed /etc/swift/remakerings.$p to /etc/swift/remakerings"
+  rm -f /etc/swift/remakerings.$p;
+  echo "deleted /etc/swift/remakerings.$p"
+done
+
+chmod +x /etc/swift/remakerings
+echo "made remakerings executable (+x)"
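+
+# For reference (illustrative, assuming two devices swift-d0 and swift-d1),
+# the generated /etc/swift/remakerings ends up looking roughly like:
+#   rm -f *.builder *.ring.gz backups/*.builder backups/*.ring.gz
+#   swift-ring-builder object.builder create 10 1 1
+#   swift-ring-builder object.builder add r1z1-127.0.0.1:6200/swift-d0 1
+#   swift-ring-builder object.builder add r1z1-127.0.0.1:6200/swift-d1 1
+#   swift-ring-builder object.builder rebalance
+#   ...followed by the same create/add/rebalance block for container (port
+#   6201) and account (port 6202).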
diff --git a/docker/rootfs/etc/swift_build/prepare_rings b/docker/rootfs/etc/swift_build/prepare_rings
new file mode 100755
index 0000000000..7b951ff223
--- /dev/null
+++ b/docker/rootfs/etc/swift_build/prepare_rings
@@ -0,0 +1,6 @@
+#!/usr/bin/with-contenv sh
+
+/etc/swift_build/build_devices
+/etc/swift_build/build_remakerings
+cd /etc/swift
+/etc/swift/remakerings
diff --git a/docker/s6-gpg-pub-key b/docker/s6-gpg-pub-key
new file mode 100644
index 0000000000..c3a865fa2c
--- /dev/null
+++ b/docker/s6-gpg-pub-key
@@ -0,0 +1,69 @@
+-----BEGIN PGP PUBLIC KEY BLOCK-----
+Version: SKS 1.1.6
+Comment: Hostname: pgp.mit.edu
+
+mQINBFe3YfMBEAC6pERKLjXDcWWrMU9l68ujJkbCjtnKYRKsIjsmvoETHJkCZaHXX0JoVFth
+7OEhEh8wQG6PTWb6HPFWJxKJaLTOS6d5xc7i8iMWFjUkssh7jEJY0unON8OleggjL4bPz2Ra
+Ox5hKJru1A8BjDdT4XyYWk+PFjaJGmll7FyqyVIng2bGRYgRah+CjKPjzk1RX5cfz48lO1wg
+Fs4rzd/SrpcbqMW1nv57ZCNK1nPrDpXytrMA2ZaMxWa5I13NXTQ9hJw0yhCV46f+4vXBvz4l
+0HrVqlZE16iaiW9rniHHM1FFqH9aOMU6PWWNzrO4cyMiNBEgLT5jNAFFteKufUKaOlGRT768
+kyRfvC/uYND3BdZ8EcC+e8Fe+g7Xj/L85853XeCApDIT+FG4Poiby71SWu/PDk9qm/BJ18kh
+6f8EJvWJWMBQJCQHYs5LWEU0BUSnFucbJhd6wF+47wDC9hByvwSOc+5Q4BIj4WHoOCYjaeX5
+ET2Kto7+E4UZjC+38q0G7oH4sOfe7FFHW/R9y/9AUj/AGhNx+lyruKOXKuTZByZlHZKWV4LT
+mkey3NIRahYKWWZIBN8ndAkP62QHuMGfWOKDC6VwgFVQGkHGYZ3NuEUNsN35P77XY7G7K8dV
+wlidTS57JZarNpILNJJsYkfMd6zrRZf9a+cZWMxyvgXKgaCx4QARAQABtDVKdXN0IENvbnRh
+aW5lcnMgQm90IDxqdXN0LmNvbnRhaW5lcnMucm9ib3RAZ21haWwuY29tPokCNAQTAQoAHgUC
+V7dh8wIbAwMLCQcDFQoIAh4BAheAAxYCAQIZAQAKCRBhAbJ4Oy/RYQrJD/49WWEJXgcZClEt
+BQUTo9KZKehAh9K5+455/lFtUh8YEhiF+7HAVlOL3KlGbg/ZUXkrXbGMW4Cm91nz99Fr+rZp
+LPcogZ0Lox5IVPn6zjmxRrWuaEvH/SlnhjUiBj9/rMgWwzTSV0PLP6bOhMJ0NIteAgW+jzSy
+4Sf4N+3XE1HAeL3sUtYex0FXzRTQAjMAnCa6AJS1dCJRc0tuI13XkiZnVnqELF2CCSnaPj6o
+hn/90/sKhr7PSGQznagiAjG49nzqOE/9CRVOy8JqNS+1Y8A1PmCVofvgy3uaPKL/yLMRXk2j
++5Fed9aVGXG3JE5lJjWUAyeL3jTEdE336tc+kHVUXrTSza/akvFHTJQfaw+MVuRIPT2JvZLl
+ePOxHgM+U9eOJ7rwXYoLS/e5KrGvhi+LCMO3r4UfIGL3cgtGkM7rwvfY3uMCq7hfoA6d4SGw
+h99J6h3M7O9+UxB4VH8yjQJl6ghY0ruEgp1PpKSo9Ogdz/loZpEExnOzp4zrdFalKcy9ehUh
+Ody/S79NlKsWOE1DtbM6IQHDxZplT9IJhTxuqrDgsIaYgwUxipqvA/kEU5k5QIIoJU8u5o6i
+ZLuC6mlqOhjmLst6/ndXuVAG4GwDKrwxri3zmctxHRwDzTJXsZsKYOqrheO6HRu+6VVVNAI5
+Q/nI/vN79vbZGAb8Z5PgZrkBDQRXt2HzAQgAsrKhLIusc/9dUOPi9f3FN30obwZLZRp8qTND
+glqSyAaL5WiiGJII1erM66s1dIv1qqUbTNd6nAKfb2w5zbgAOTAKsGNEzljFKAApdZm/sAyk
+Wx9PTqVQov6PAjzgoWC9yH8UcxhvxPtpw+rqnz1oUVK9paszoZWuPz5jAE/ZhdrEXy/51ckS
+jJ/p8T55SFK3p6UzSGDqQRfDwHDgDJMIzPABpnPk+ETf/YYWbJwOx81YrlRKBau8XdyBkRlK
+ZeZ+SrvDMugn45lWSdjXJZ2BH1U7akuWd7lYP3xI/Vfs2rF3e+7+72W75s/3pOVckdbgn13B
+REgdptgOBX9ILCtpwQARAQABiQNEBBgBCgAPBQJXt2HzBQkPCZwAAhsiASkJEGEBsng7L9Fh
+wF0gBBkBCgAGBQJXt2HzAAoJECU2yhbfT82iCzoH/iAw5+zBpXdE3Ju/KrCpZ4JwzSkAw4n7
+uj4UzTtzYb5KfkXAkIQFq5MTHJ6jpHe6g6aJf5Z4NV2cbw/4d9W5rAzXkuKnksoo7JbRDt+T
+adCBCuoz8HvkVT4lgV6TTWx3kMESGaqz/y0d8P+FRCKhmbv4ayTAZZJM2cdDcqtum8sYPs9R
+d6L13x8hZGTSKavLwus64/GA2tOa334zDDI1+7AoJRRLApqdYZmX/LrQykNoNR7RSzLIn5+S
+GdCS6JU8c0oQnJgf+7zililWqagkYRqaHhcBy90XiYOPMdHyKmudcfvpYLE78E0iyHhfmsAj
+I+pK3U4MquRA+v8AfL5/PLRKbhAAomTfB2WPI9ea1nN6OfCZZE9bq/PVmeahW0CZoBmCQJLn
+oypbBtMUnOhSFd+QUWekH8+prkvq15s8LdjfhJWlzMRbwourZvffmeHX8dTuMZwwV+7flnf+
+AH9OnwcKNg5/T4aRm3gZGSV7fTFh1Regx3136TIyRcwPqjwqbc9slW6Bg9veE3ayveUKaG0S
+WDjkPad4wqFWTF84vAD+T6p1hMxBrInkj8ocHXkyxdndQAuVd4dCjdm/dlpFs/ntZFhVQUFG
+zjqZaSvqQpKIui1x3WDap1RFy7n81B/e23eO+R8CyJg+upI38FIroR38EGhEFAjgcqKSi+0f
+WDsXR49XjIO5EX7RkFhnMudvMA+sW2PsI7yAfIFrTO8VEnevAwsVNIeTpyYnVVFBTUGeRP5u
+9eNoLO3wHpARvsT4JtmdVWoTX2XzQA9xXa+6cOmiT4XLnwtIU4a8W1dfINqMUVLBhIJD2zvL
+TppISqzmIISugSMiNND0kvkp9moYXz0QodrEHzJDZmzqbTv5IAs+gPER1eNS2BZKJjXJ7Egn
+2JDWIRgm2kzS1BaSyL004F39AfsKCBcsBsbsTIUcmpRUwLjMpdkomkGGA3RHnfk06odrEEQO
+72ZOIsIwd1+X5U8tK9pnEH0/RsZONUMPtGrQ4Pe0ZlNZUHCyN6U633MUO32Wmru5AQ0EV7dh
+8wEIAOAvY6Wrlp6k/Fknu/wIZLWoGIOTR11iYgHHvVWWeoatleewsqHbzCMiCQ5txX5RJJv7
+F5xDURmoqwpKdkjFVqriuCt506MeztBohRqTvDYOczS/eQJuI+pR9/aGmESErP9+B9AmQ+rN
+no391Z+HRI75VIP+AnTZGYVMec5fQbFUwws3Dt9VeXgPIPixfVoXtz5vQPj9EfH3RTQ//9Vz
+zznZkHBPFMroM3VLznwlDb9a2Z4S4WVgztMMrZnlYmym6tN1sm61TPNK+4KFy+FNFbudcHcg
+AXXT7H5/rNhUD8aMMLAQHqNCeg/eXCQO0Sp2TzBs/x90jti9cGmyMfsZDKkAEQEAAYkDRAQY
+AQoADwUCV7dh8wUJDwmcAAIbDAEpCRBhAbJ4Oy/RYcBdIAQZAQoABgUCV7dh8wAKCRDZBk7K
+WLNt46vQB/0QOlN8vMJNVlJJZ2TD+Es63/bjd/oa1djnBXFhqii/vY1WI7c1lUK+JPIu7RpE
+eb3ZwpwnTeHxLe+kJtvEjTdHygM0KtWdq+MHAX+t+5AJA9UyVIQupztH+/87/GvtxYMIQRwg
+WY9ExP1HAi8vyLxOxQNmc1A3boYY5GA16L3AOGxtOIn43qDTz5RwY+s1A1zyUq4zczBA/Fma
+ddqN0N/arjHEkE1cLXEypcYme1xfLE8mpU3/7FSyHdQxW2o/KqoDkqVj12oKAMuBnKcYoKmr
+qsmy8eHpmbfMUrRE7frpGeF4II/NgCfEYOAxysOOq4IRXQClaZpquL4AOXN2EVjz/awQAKU6
+fpScpzZoNAMJYnbTQrs8YEy4VUFvUyZWpSVDj5aAhrZApbb7LfGQyBMFxHARnwDGv9AK6Sl+
+vHp8zvPn9nHE3D9tLGIWtjCRRhPe/RY1wWyw8ZUmBN6jDZ1LSh/Tqr7J24zsLmxGBUJcDfZ/
+awv/sabqPp0AGbs/qQwjxgWj9en6IS2+mWnWL3sQXOmxdFil/0+Tx5WOrEtCkR35yPLnTSeY
+xKP6KKfG7gA8xLxXKxxVMojjAzN0Dxb0+0iQ4RwPygb79OzAsx588Rv2Qo8kf0QyvgUZhufv
+q355qQ248FU4gBEcLc5b2yu1Iz1nToubu74Uwl9t7XzZs+RP/6ZGuItSHxsqLzVFexmNdcXh
+oKfu58NnH1Fi9wMKtAKCH31q235wSh/x0YM391cdIvSjxfItNXtykR7KDbal7YLOa5dKyRyf
+2WiYMCEAQSoRVj6A4ylRsqs9hirvYinNSWPa1ZrketKz+9g+rj0/pmQjKAPiapYkarp5yT8d
+dgQ1XuwGCaPZXhByS9s6SonZwvrthrHFoWfK7JzkepYoBKy/nGUNt+9NDWbCB6sAe2zLAfmA
+tsOhB7ZO8/AlPRQCIvEGRXcEtbYkxtB2vMNGPbIoHDv5QvbHP0Foj79SwRg/2a9wiq6i5Vwv
+wGWOhC4ELGF+imX35GGbJq0a8A2z5WX6
+=VHze
+-----END PGP PUBLIC KEY BLOCK-----
diff --git a/etc/account-server.conf-sample b/etc/account-server.conf-sample
index 5cb0d2897e..fc21517a11 100644
--- a/etc/account-server.conf-sample
+++ b/etc/account-server.conf-sample
@@ -1,38 +1,86 @@
 [DEFAULT]
 # bind_ip = 0.0.0.0
-# bind_port = 6002
+bind_port = 6202
+# keep_idle = 600
 # bind_timeout = 30
 # backlog = 4096
-# workers = 1
 # user = swift
 # swift_dir = /etc/swift
 # devices = /srv/node
 # mount_check = true
 # disable_fallocate = false
+#
+# Use an integer to override the number of pre-forked processes that will
+# accept connections.
+# workers = auto
+#
+# Maximum concurrent requests per worker
+# max_clients = 1024
+#
 # You can specify default log routing here if you want:
 # log_name = swift
 # log_facility = LOG_LOCAL0
 # log_level = INFO
 # log_address = /dev/log
+# The following caps the length of log lines to the value given; no limit if
+# set to 0, the default.
+# log_max_line_length = 0
+#
+# Hashing algorithm for log anonymization. Must be one of algorithms supported
+# by Python's hashlib.
+# log_anonymization_method = MD5
+#
+# Salt added during log anonymization
+# log_anonymization_salt =
+#
+# Template used to format logs. All words surrounded by curly brackets
+# will be substituted with the appropriate values
+# log_format = {remote_addr} - - [{time.d}/{time.b}/{time.Y}:{time.H}:{time.M}:{time.S} +0000] "{method} {path}" {status} {content_length} "{referer}" "{txn_id}" "{user_agent}" {trans_time:.4f} "{additional_info}" {pid} {policy_index}
+#
 # comma separated list of functions to call to setup custom log handlers.
 # functions get passed: conf, name, log_to_console, log_route, fmt, logger,
 # adapted_logger
 # log_custom_handlers =
+#
 # If set, log_udp_host will override log_address
 # log_udp_host =
 # log_udp_port = 514
+#
 # You can enable StatsD logging here:
-# log_statsd_host = localhost
+# log_statsd_host =
 # log_statsd_port = 8125
-# log_statsd_default_sample_rate = 1
+# log_statsd_default_sample_rate = 1.0
+# log_statsd_sample_rate_factor = 1.0
 # log_statsd_metric_prefix =
+#
 # If you don't mind the extra disk space usage in overhead, you can turn this
 # on to preallocate disk space with SQLite databases to decrease fragmentation.
 # db_preallocation = off
+#
+# Enable this option to log all sqlite3 queries (requires python >=3.3)
+# db_query_logging = off
+#
 # eventlet_debug = false
+#
+# You can set fallocate_reserve to the number of bytes or percentage of disk
+# space you'd like fallocate to reserve, whether there is space for the given
+# file size or not. Percentage will be used if the value ends with a '%'.
+# fallocate_reserve = 1%
+#
+# You can set scheduling priority of processes. Niceness values range from -20
+# (most favorable to the process) to 19 (least favorable to the process).
+# nice_priority =
+#
+# You can set I/O scheduling class and priority of processes. I/O niceness
+# class values are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and
+# IOPRIO_CLASS_IDLE (idle). I/O niceness priority is a number which goes from
+# 0 to 7. The higher the value, the lower the I/O priority of the process.
+# Work only with ionice_class.
+# ionice_class =
+# ionice_priority =
 
 [pipeline:main]
-pipeline = healthcheck recon account-server
+pipeline = healthcheck recon backend_ratelimit account-server
 
 [app:account-server]
 use = egg:swift#account
@@ -40,9 +88,41 @@ use = egg:swift#account
 # set log_name = account-server
 # set log_facility = LOG_LOCAL0
 # set log_level = INFO
-# set log_requests = True
+# set log_requests = true
 # set log_address = /dev/log
-# auto_create_account_prefix = .
+#
+# You can disable REPLICATE handling (default is to allow it). When deploying
+# a cluster with a separate replication network, you'll want multiple
+# account-server processes running: one for client-driven traffic and another
+# for replication traffic. The server handling client-driven traffic may set
+# this to false. If there is only one account-server process, leave this as
+# true.
+# replication_server = true
+#
+# You can set scheduling priority of processes. Niceness values range from -20
+# (most favorable to the process) to 19 (least favorable to the process).
+# nice_priority =
+#
+# You can set I/O scheduling class and priority of processes. I/O niceness
+# class values are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and
+# IOPRIO_CLASS_IDLE (idle). I/O niceness priority is a number which goes from
+# 0 to 7. The higher the value, the lower the I/O priority of the process.
+# Work only with ionice_class.
+# ionice_class =
+# ionice_priority =
+#
+# You can set fallocate_reserve to the number of bytes or percentage
+# of disk space you'd like kept free at all times. If the disk's free
+# space falls below this value, then PUT, POST, and REPLICATE requests
+# will be denied until the disk has more space available. Percentage
+# will be used if the value ends with a '%'.
+# fallocate_reserve = 1%
+#
+# When reloading servers with SIGUSR1, workers running with old config/code
+# are allowed some time to finish serving in-flight requests. Use this to
+# configure the grace period (in seconds), after which the reloaded server
+# will issue SIGKILLs to remaining stale workers.
+# stale_worker_timeout = 86400
 
 [filter:healthcheck]
 use = egg:swift#healthcheck
@@ -54,29 +134,106 @@ use = egg:swift#healthcheck
 use = egg:swift#recon
 # recon_cache_path = /var/cache/swift
 
+[filter:backend_ratelimit]
+use = egg:swift#backend_ratelimit
+# Config options can optionally be loaded from a separate config file. Config
+# options in this section will be used unless the same option is found in the
+# config file, in which case the config file option will be used. See the
+# backend-ratelimit.conf-sample file for details of available config options.
+# backend_ratelimit_conf_path = /etc/swift/backend-ratelimit.conf
+
+# The minimum interval between attempts to reload any config file at
+# backend_ratelimit_conf_path while the server is running. A value of 0 means
+# that the file is loaded at start-up but not subsequently reloaded. Note that
+# config options in this section are never reloaded after start-up.
+# config_reload_interval = 60
+
 [account-replicator]
 # You can override the default log routing for this app here (don't use set!):
 # log_name = account-replicator
 # log_facility = LOG_LOCAL0
 # log_level = INFO
 # log_address = /dev/log
-# vm_test_mode = no
+#
+# Maximum number of database rows that will be sync'd in a single HTTP
+# replication request. Databases with less than or equal to this number of
+# differing rows will always be sync'd using an HTTP replication request rather
+# than using rsync.
 # per_diff = 1000
+#
+# Maximum number of HTTP replication requests attempted on each replication
+# pass for any one account database. This caps how long the replicator will
+# spend trying to sync a given database per pass so the other databases don't
+# get starved.
 # max_diffs = 100
+#
+# Number of replication workers to spawn.
 # concurrency = 8
-# interval = 30
-# How long without an error before a node's error count is reset. This will
-# also be how long before a node is reenabled after suppression is triggered.
-# error_suppression_interval = 60
-# How many errors can accumulate before a node is temporarily ignored.
-# error_suppression_limit = 10
+#
+# Time in seconds to wait between replication passes
+# interval = 30.0
+# run_pause is deprecated, use interval instead
+# run_pause = 30.0
+#
+# Process at most this many databases per second
+# databases_per_second = 50
+#
 # node_timeout = 10
 # conn_timeout = 0.5
+#
 # The replicator also performs reclamation
 # reclaim_age = 604800
-# Time in seconds to wait between replication passes
-# run_pause = 30
+#
+# Allow rsync to compress data which is transmitted to destination node
+# during sync. However, this is applicable only when destination node is in
+# a different region than the local one.
+# rsync_compress = no
+#
+# Format of the rsync module where the replicator will send data. See
+# etc/rsyncd.conf-sample for some usage examples.
+# rsync_module = {replication_ip}::account
+#
 # recon_cache_path = /var/cache/swift
+#
+# You can set scheduling priority of processes. Niceness values range from -20
+# (most favorable to the process) to 19 (least favorable to the process).
+# nice_priority =
+#
+# You can set I/O scheduling class and priority of processes. I/O niceness
+# class values are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and
+# IOPRIO_CLASS_IDLE (idle). I/O niceness priority is a number which goes from
+# 0 to 7. The higher the value, the lower the I/O priority of the process.
+# Work only with ionice_class.
+# ionice_class =
+# ionice_priority =
+#
+# The handoffs_only and handoff_delete options are for special-case emergency
+# situations such as full disks in the cluster. These options SHOULD NOT
+# BE ENABLED except in emergencies. When handoffs_only mode is enabled
+# the replicator will *only* replicate from handoff nodes to primary
+# nodes and will not sync primary nodes with other primary nodes.
+#
+# This has two main effects: first, the replicator becomes much more
+# effective at removing misplaced databases, thereby freeing up disk
+# space at a much faster pace than normal. Second, the replicator does
+# not sync data between primary nodes, so out-of-sync account and
+# container listings will not resolve while handoffs_only is enabled.
+#
+# This mode is intended to allow operators to temporarily sacrifice
+# consistency in order to gain faster rebalancing, such as during a
+# capacity addition with nearly-full disks. It is not intended for
+# long-term use.
+#
+# handoffs_only = no
+#
+# handoff_delete is the number of replicas which are ensured in swift.
+# If a number less than the number of replicas is set, the account-replicator
+# may delete local handoffs even though not all replicas are ensured in the
+# cluster. The replicator will remove the local handoff account database after
+# syncing when the number of successful responses is greater than or equal to
+# this number. By default (auto), handoff partitions will be removed only when
+# they have been successfully replicated to all the canonical nodes.
+# handoff_delete = auto
 
 [account-auditor]
 # You can override the default log routing for this app here (don't use set!):
@@ -84,11 +241,24 @@ use = egg:swift#recon
 # log_facility = LOG_LOCAL0
 # log_level = INFO
 # log_address = /dev/log
-# Will audit, at most, 1 account per device per interval
-# interval = 1800
-# log_facility = LOG_LOCAL0
-# log_level = INFO
+#
+# Will audit each account at most once per interval
+# interval = 1800.0
+#
+# accounts_per_second = 200
 # recon_cache_path = /var/cache/swift
+#
+# You can set scheduling priority of processes. Niceness values range from -20
+# (most favorable to the process) to 19 (least favorable to the process).
+# nice_priority =
+#
+# You can set I/O scheduling class and priority of processes. I/O niceness
+# class values are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and
+# IOPRIO_CLASS_IDLE (idle). I/O niceness priority is a number which goes from
+# 0 to 7. The higher the value, the lower the I/O priority of the process.
+# Work only with ionice_class.
+# ionice_class =
+# ionice_priority =
 
 [account-reaper]
 # You can override the default log routing for this app here (don't use set!):
@@ -96,11 +266,72 @@ use = egg:swift#recon
 # log_facility = LOG_LOCAL0
 # log_level = INFO
 # log_address = /dev/log
+#
 # concurrency = 25
-# interval = 3600
+# interval = 3600.0
 # node_timeout = 10
 # conn_timeout = 0.5
+#
 # Normally, the reaper begins deleting account information for deleted accounts
 # immediately; you can set this to delay its work however. The value is in
-# seconds; 2592000 = 30 days for example.
+# seconds; 2592000 = 30 days for example. The sum of this value and the
+# container-updater interval should be less than the account-replicator
+# reclaim_age. This ensures that once the account-reaper has deleted a
+# container there is sufficient time for the container-updater to report to the
+# account before the account DB is removed.
 # delay_reaping = 0
+#
+# If the account fails to be reaped due to a persistent error, the
+# account reaper will log a message such as:
+#     Account <name> has not been reaped since <date>
+# You can search logs for this message if space is not being reclaimed
+# after you delete account(s).
+# Default is 2592000 seconds (30 days). This is in addition to any time
+# requested by delay_reaping.
+# reap_warn_after = 2592000
+#
+# You can set scheduling priority of processes. Niceness values range from -20
+# (most favorable to the process) to 19 (least favorable to the process).
+# nice_priority =
+#
+# You can set I/O scheduling class and priority of processes. I/O niceness
+# class values are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and
+# IOPRIO_CLASS_IDLE (idle). I/O niceness priority is a number which goes from
+# 0 to 7. The higher the value, the lower the I/O priority of the process.
+# Work only with ionice_class.
+# ionice_class =
+# ionice_priority =
+
+# Note: Put it at the beginning of the pipeline to profile all middleware. But
+# it is safer to put this after healthcheck. Not intended for production
+# environments!
+[filter:xprofile]
+use = egg:swift#xprofile
+# This option enables you to switch profilers; the profiler should inherit
+# from the Python standard profiler. Currently supported values include
+# 'cProfile' and 'eventlet.green.profile'.
+# profile_module = eventlet.green.profile
+#
+# This prefix will be used to combine process ID and timestamp to name the
+# profile data file.  Make sure the executing user has permission to write
+# into this path (missing path segments will be created, if necessary).
+# If you enable profiling in more than one type of daemon, you must override
+# it with a unique value like: /var/log/swift/profile/account.profile
+# log_filename_prefix = /tmp/log/swift/profile/default.profile
+#
+# The profile data will be dumped to local disk based on the above naming
+# rule at this interval.
+# dump_interval = 5.0
+#
+# Be careful: this option makes the profiler dump data into timestamped files,
+# which means many files will pile up in the directory.
+# dump_timestamp = false
+#
+# This is the path of the URL to access the mini web UI.
+# path = /__profile__
+#
+# Clear the data when the wsgi server shutdown.
+# flush_at_shutdown = false
+#
+# unwind the iterator of applications
+# unwind = false
diff --git a/etc/backend-ratelimit.conf-sample b/etc/backend-ratelimit.conf-sample
new file mode 100644
index 0000000000..5912b6668e
--- /dev/null
+++ b/etc/backend-ratelimit.conf-sample
@@ -0,0 +1,30 @@
+[backend_ratelimit]
+# The rate of requests to each device is limited by an overall per-device rate
+# limit that is applied to all requests to the device and/or a
+# per-method-per-device rate limit that is applied to requests of that method
+# to the device. If either of these rates would be exceeded the server will
+# return 529 responses and emit a 'backend.ratelimit' statsd metric without
+# logging.
+
+# Set the maximum overall rate of requests per device per second per worker for
+# all request methods. The default value of zero causes no per-device
+# rate-limiting to be applied other than that configured for specific request
+# methods.
+# requests_per_device_per_second = 0.0
+
+# Set maximum rate of requests per device per second per worker for individual
+# request methods. The default value of zero causes no per-method
+# rate-limiting to be applied. Note: the aggregate rate of requests for all
+# methods is still limited by requests_per_device_per_second even if a higher
+# per method rate is configured.
+# delete_requests_per_device_per_second = 0.0
+# get_requests_per_device_per_second = 0.0
+# head_requests_per_device_per_second = 0.0
+# post_requests_per_device_per_second = 0.0
+# put_requests_per_device_per_second = 0.0
+# replicate_requests_per_device_per_second = 0.0
+# update_requests_per_device_per_second = 0.0
+
+# Set the number of seconds of unused rate-limiting allowance that can
+# accumulate and be used to allow a subsequent burst of requests.
+# requests_per_device_rate_buffer = 1.0
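+
+# Illustrative example (the values are placeholders, not recommendations):
+# cap each device at 250 requests/s overall while further limiting REPLICATE
+# requests to 5/s per device per worker:
+# requests_per_device_per_second = 250.0
+# replicate_requests_per_device_per_second = 5.0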
diff --git a/etc/container-reconciler.conf-sample b/etc/container-reconciler.conf-sample
new file mode 100644
index 0000000000..6011a3c21e
--- /dev/null
+++ b/etc/container-reconciler.conf-sample
@@ -0,0 +1,96 @@
+[DEFAULT]
+# swift_dir = /etc/swift
+# user = swift
+# ring_check_interval = 15.0
+# You can specify default log routing here if you want:
+# log_name = swift
+# log_facility = LOG_LOCAL0
+# log_level = INFO
+# log_address = /dev/log
+#
+# comma separated list of functions to call to setup custom log handlers.
+# functions get passed: conf, name, log_to_console, log_route, fmt, logger,
+# adapted_logger
+# log_custom_handlers =
+#
+# If set, log_udp_host will override log_address
+# log_udp_host =
+# log_udp_port = 514
+#
+# You can enable StatsD logging here:
+# log_statsd_host =
+# log_statsd_port = 8125
+# log_statsd_default_sample_rate = 1.0
+# log_statsd_sample_rate_factor = 1.0
+# log_statsd_metric_prefix =
+#
+# You can set scheduling priority of processes. Niceness values range from -20
+# (most favorable to the process) to 19 (least favorable to the process).
+# nice_priority =
+#
+# You can set I/O scheduling class and priority of processes. I/O niceness
+# class values are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and
+# IOPRIO_CLASS_IDLE (idle). I/O niceness priority is a number which goes from
+# 0 to 7. The higher the value, the lower the I/O priority of the process.
+# Work only with ionice_class.
+# ionice_class =
+# ionice_priority =
+
+[container-reconciler]
+# If the source object is not available, the reconciler will re-attempt
+# reconciliation for up to reclaim_age seconds before it gives up and deletes
+# the entry in the queue.
+# reclaim_age = 604800
+# The cycle time of the daemon
+# interval = 30.0
+# Server errors from requests will be retried by default
+# request_tries = 3
+#
+# You can set scheduling priority of processes. Niceness values range from -20
+# (most favorable to the process) to 19 (least favorable to the process).
+# nice_priority =
+#
+# You can set I/O scheduling class and priority of processes. I/O niceness
+# class values are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and
+# IOPRIO_CLASS_IDLE (idle). I/O niceness priority is a number which goes from
+# 0 to 7. The higher the value, the lower the I/O priority of the process.
+# Work only with ionice_class.
+# ionice_class =
+# ionice_priority =
+# Number of objects to process concurrently per process
+# concurrency = 1
+
+# processes is how many parts to divide the work into, one part per process
+# that will be doing the work
+# Setting processes to 0 means a single process will do all the work.
+# processes = 0
+#
+# process is which of the parts a particular process will work on
+# process is "zero based": if you want to use 3 processes, you should run
+# three processes with process set to 0, 1, and 2 respectively
+# process = 0
+
+[pipeline:main]
+# Note that the reconciler's pipeline is intentionally very sparse -- it is
+# only responsible for moving data from one policy to another and should not
+# perform any transformations beyond (potentially) changing erasure coding.
+# It notably MUST NOT include transformative middlewares (such as encryption),
+# redirection middlewares (such as symlink), or composing middlewares (such
+# as slo and dlo).
+pipeline = catch_errors proxy-logging cache proxy-server
+
+[app:proxy-server]
+use = egg:swift#proxy
+# See proxy-server.conf-sample for options
+
+[filter:cache]
+use = egg:swift#memcache
+# See proxy-server.conf-sample for options
+
+[filter:proxy-logging]
+use = egg:swift#proxy_logging
+# See proxy-server.conf-sample for options
+
+[filter:catch_errors]
+use = egg:swift#catch_errors
+# See proxy-server.conf-sample for options
diff --git a/etc/container-server.conf-sample b/etc/container-server.conf-sample
index 728fa4cd3c..fbf5caad07 100644
--- a/etc/container-server.conf-sample
+++ b/etc/container-server.conf-sample
@@ -1,41 +1,92 @@
 [DEFAULT]
 # bind_ip = 0.0.0.0
-# bind_port = 6001
+bind_port = 6201
+# keep_idle = 600
 # bind_timeout = 30
 # backlog = 4096
-# workers = 1
 # user = swift
 # swift_dir = /etc/swift
 # devices = /srv/node
 # mount_check = true
 # disable_fallocate = false
+#
+# Use an integer to override the number of pre-forked processes that will
+# accept connections.
+# workers = auto
+#
+# Maximum concurrent requests per worker
+# max_clients = 1024
+#
 # This is a comma separated list of hosts allowed in the X-Container-Sync-To
-# field for containers.
+# field for containers. This is the old-style of using container sync. It is
+# strongly recommended to use the new style of a separate
+# container-sync-realms.conf -- see container-sync-realms.conf-sample
 # allowed_sync_hosts = 127.0.0.1
+#
 # You can specify default log routing here if you want:
 # log_name = swift
 # log_facility = LOG_LOCAL0
 # log_level = INFO
 # log_address = /dev/log
+# The following caps the length of log lines to the value given; no limit if
+# set to 0, the default.
+# log_max_line_length = 0
+#
+# Hashing algorithm for log anonymization. Must be one of algorithms supported
+# by Python's hashlib.
+# log_anonymization_method = MD5
+#
+# Salt added during log anonymization
+# log_anonymization_salt =
+#
+# Template used to format logs. All words surrounded by curly brackets
+# will be substituted with the appropriate values
+# log_format = {remote_addr} - - [{time.d}/{time.b}/{time.Y}:{time.H}:{time.M}:{time.S} +0000] "{method} {path}" {status} {content_length} "{referer}" "{txn_id}" "{user_agent}" {trans_time:.4f} "{additional_info}" {pid} {policy_index}
+#
 # comma separated list of functions to call to setup custom log handlers.
 # functions get passed: conf, name, log_to_console, log_route, fmt, logger,
 # adapted_logger
 # log_custom_handlers =
+#
 # If set, log_udp_host will override log_address
 # log_udp_host =
 # log_udp_port = 514
+#
 # You can enable StatsD logging here:
-# log_statsd_host = localhost
+# log_statsd_host =
 # log_statsd_port = 8125
-# log_statsd_default_sample_rate = 1
+# log_statsd_default_sample_rate = 1.0
+# log_statsd_sample_rate_factor = 1.0
 # log_statsd_metric_prefix =
+#
 # If you don't mind the extra disk space usage in overhead, you can turn this
 # on to preallocate disk space with SQLite databases to decrease fragmentation.
 # db_preallocation = off
+#
+# Enable this option to log all sqlite3 queries (requires python >=3.3)
+# db_query_logging = off
+#
 # eventlet_debug = false
+#
+# You can set fallocate_reserve to the number of bytes or percentage of disk
+# space you'd like fallocate to reserve, whether there is space for the given
+# file size or not. Percentage will be used if the value ends with a '%'.
+# fallocate_reserve = 1%
+#
+# You can set scheduling priority of processes. Niceness values range from -20
+# (most favorable to the process) to 19 (least favorable to the process).
+# nice_priority =
+#
+# You can set I/O scheduling class and priority of processes. I/O niceness
+# class values are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and
+# IOPRIO_CLASS_IDLE (idle). I/O niceness priority is a number which goes from
+# 0 to 7. The higher the value, the lower the I/O priority of the process.
+# Work only with ionice_class.
+# ionice_class =
+# ionice_priority =
 
 [pipeline:main]
-pipeline = healthcheck recon container-server
+pipeline = healthcheck recon backend_ratelimit container-server
 
 [app:container-server]
 use = egg:swift#container
@@ -43,12 +94,45 @@ use = egg:swift#container
 # set log_name = container-server
 # set log_facility = LOG_LOCAL0
 # set log_level = INFO
-# set log_requests = True
+# set log_requests = true
 # set log_address = /dev/log
+#
 # node_timeout = 3
 # conn_timeout = 0.5
-# allow_versions = False
-# auto_create_account_prefix = .
+# allow_versions = false
+#
+# You can disable REPLICATE handling (default is to allow it). When deploying
+# a cluster with a separate replication network, you'll want multiple
+# container-server processes running: one for client-driven traffic and another
+# for replication traffic. The server handling client-driven traffic may set
+# this to false. If there is only one container-server process, leave this as
+# true.
+# replication_server = true
+#
+# You can set scheduling priority of processes. Niceness values range from -20
+# (most favorable to the process) to 19 (least favorable to the process).
+# nice_priority =
+#
+# You can set I/O scheduling class and priority of processes. I/O niceness
+# class values are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and
+# IOPRIO_CLASS_IDLE (idle). I/O niceness priority is a number which goes from
+# 0 to 7. The higher the value, the lower the I/O priority of the process.
+# Work only with ionice_class.
+# ionice_class =
+# ionice_priority =
+#
+# You can set fallocate_reserve to the number of bytes or percentage
+# of disk space you'd like kept free at all times. If the disk's free
+# space falls below this value, then PUT, POST, and REPLICATE requests
+# will be denied until the disk has more space available. Percentage
+# will be used if the value ends with a '%'.
+# fallocate_reserve = 1%
+#
+# When reloading servers with SIGUSR1, workers running with old config/code
+# are allowed some time to finish serving in-flight requests. Use this to
+# configure the grace period (in seconds), after which the reloaded server
+# will issue SIGKILLs to remaining stale workers.
+# stale_worker_timeout = 86400
 
 [filter:healthcheck]
 use = egg:swift#healthcheck
@@ -60,24 +144,106 @@ use = egg:swift#healthcheck
 use = egg:swift#recon
 #recon_cache_path = /var/cache/swift
 
+[filter:backend_ratelimit]
+use = egg:swift#backend_ratelimit
+# Config options can optionally be loaded from a separate config file. Config
+# options in this section will be used unless the same option is found in the
+# config file, in which case the config file option will be used. See the
+# backend-ratelimit.conf-sample file for details of available config options.
+# backend_ratelimit_conf_path = /etc/swift/backend-ratelimit.conf
+
+# The minimum interval between attempts to reload any config file at
+# backend_ratelimit_conf_path while the server is running. A value of 0 means
+# that the file is loaded at start-up but not subsequently reloaded. Note that
+# config options in this section are never reloaded after start-up.
+# config_reload_interval = 60
+
 [container-replicator]
 # You can override the default log routing for this app here (don't use set!):
 # log_name = container-replicator
 # log_facility = LOG_LOCAL0
 # log_level = INFO
 # log_address = /dev/log
-# vm_test_mode = no
+#
+# Maximum number of database rows that will be sync'd in a single HTTP
+# replication request. Databases with less than or equal to this number of
+# differing rows will always be sync'd using an HTTP replication request rather
+# than using rsync.
 # per_diff = 1000
+#
+# Maximum number of HTTP replication requests attempted on each replication
+# pass for any one container. This caps how long the replicator will spend
+# trying to sync a given database per pass so the other databases don't get
+# starved.
 # max_diffs = 100
+#
+# Number of replication workers to spawn.
 # concurrency = 8
-# interval = 30
+#
+# Time in seconds to wait between replication passes
+# interval = 30.0
+# run_pause is deprecated, use interval instead
+# run_pause = 30.0
+#
+# Process at most this many databases per second
+# databases_per_second = 50
+#
 # node_timeout = 10
 # conn_timeout = 0.5
+#
 # The replicator also performs reclamation
 # reclaim_age = 604800
-# Time in seconds to wait between replication passes
-# run_pause = 30
+#
+# Allow rsync to compress data which is transmitted to destination node
+# during sync. However, this is applicable only when destination node is in
+# a different region than the local one.
+# rsync_compress = no
+#
+# Format of the rsync module where the replicator will send data. See
+# etc/rsyncd.conf-sample for some usage examples.
+# rsync_module = {replication_ip}::container
+#
 # recon_cache_path = /var/cache/swift
+#
+# You can set scheduling priority of processes. Niceness values range from -20
+# (most favorable to the process) to 19 (least favorable to the process).
+# nice_priority =
+#
+# You can set I/O scheduling class and priority of processes. I/O niceness
+# class values are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and
+# IOPRIO_CLASS_IDLE (idle). I/O niceness priority is a number which goes from
+# 0 to 7. The higher the value, the lower the I/O priority of the process.
+# Work only with ionice_class.
+# ionice_class =
+# ionice_priority =
+#
+# The handoffs_only and handoff_delete options are for special-case emergency
+# situations such as full disks in the cluster. These options SHOULD NOT
+# BE ENABLED except in emergencies. When handoffs_only mode is enabled
+# the replicator will *only* replicate from handoff nodes to primary
+# nodes and will not sync primary nodes with other primary nodes.
+#
+# This has two main effects: first, the replicator becomes much more
+# effective at removing misplaced databases, thereby freeing up disk
+# space at a much faster pace than normal. Second, the replicator does
+# not sync data between primary nodes, so out-of-sync account and
+# container listings will not resolve while handoffs_only is enabled.
+#
+# This mode is intended to allow operators to temporarily sacrifice
+# consistency in order to gain faster rebalancing, such as during a
+# capacity addition with nearly-full disks. It is not intended for
+# long-term use.
+#
+# handoffs_only = no
+#
+# handoff_delete is the number of replicas which are ensured in swift.
+# If a number less than the number of replicas is set, the container-replicator
+# may delete local handoffs even though not all replicas are ensured in the
+# cluster: the replicator will remove a local handoff container database after
+# syncing when the number of successful responses is greater than or equal to
+# this number. By default (auto), handoff partitions will only be removed
+# once they have successfully replicated to all the canonical nodes.
+# handoff_delete = auto
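+#
+# For example (illustrative, assuming 3 container replicas): setting
+# handoff_delete = 2 would let the replicator remove a local handoff
+# database once 2 of the 3 primary nodes have been successfully synced,
+# rather than waiting for all 3 as the default 'auto' does.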
 
 [container-updater]
 # You can override the default log routing for this app here (don't use set!):
@@ -85,15 +251,35 @@ use = egg:swift#recon
 # log_facility = LOG_LOCAL0
 # log_level = INFO
 # log_address = /dev/log
-# interval = 300
+#
+# interval = 300.0
 # concurrency = 4
 # node_timeout = 3
 # conn_timeout = 0.5
-# slowdown will sleep that amount between containers
+#
+# Send at most this many container updates per second
+# containers_per_second = 50
+#
+# slowdown will sleep that amount between containers. Deprecated; use
+# containers_per_second instead.
 # slowdown = 0.01
+#
 # Seconds to suppress updating an account that has generated an error
 # account_suppression_time = 60
+#
 # recon_cache_path = /var/cache/swift
+#
+# You can set scheduling priority of processes. Niceness values range from -20
+# (most favorable to the process) to 19 (least favorable to the process).
+# nice_priority =
+#
+# You can set I/O scheduling class and priority of processes. I/O niceness
+# class values are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and
+# IOPRIO_CLASS_IDLE (idle). I/O niceness priority is a number which goes from
+# 0 to 7. The higher the value, the lower the I/O priority of the process.
+# Work only with ionice_class.
+# ionice_class =
+# ionice_priority =
 
 [container-auditor]
 # You can override the default log routing for this app here (don't use set!):
@@ -101,9 +287,24 @@ use = egg:swift#recon
 # log_facility = LOG_LOCAL0
 # log_level = INFO
 # log_address = /dev/log
-# Will audit, at most, 1 container per device per interval
-# interval = 1800
+#
+# Will audit each container at most once per interval
+# interval = 1800.0
+#
+# containers_per_second = 200
 # recon_cache_path = /var/cache/swift
+#
+# You can set scheduling priority of processes. Niceness values range from -20
+# (most favorable to the process) to 19 (least favorable to the process).
+# nice_priority =
+#
+# You can set I/O scheduling class and priority of processes. I/O niceness
+# class values are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and
+# IOPRIO_CLASS_IDLE (idle). I/O niceness priority is a number which goes from
+# 0 to 7. The higher the value, the lower the I/O priority of the process.
+# Work only with ionice_class.
+# ionice_class =
+# ionice_priority =
 
 [container-sync]
 # You can override the default log routing for this app here (don't use set!):
@@ -111,9 +312,246 @@ use = egg:swift#recon
 # log_facility = LOG_LOCAL0
 # log_level = INFO
 # log_address = /dev/log
+#
 # If you need to use an HTTP Proxy, set it here; defaults to no proxy.
-# sync_proxy = http://127.0.0.1:8888
-# Will sync, at most, each container once per interval
-# interval = 300
+# You can also set this to a comma separated list of HTTP Proxies and they will
+# be randomly used (simple load balancing).
+# sync_proxy = http://10.1.1.1:8888,http://10.1.1.2:8888
+#
+# Will sync each container at most once per interval
+# interval = 300.0
+#
 # Maximum amount of time to spend syncing each container per pass
 # container_time = 60
+#
+# Maximum amount of time in seconds for the connection attempt
+# conn_timeout = 5
+# Server errors from requests will be retried by default
+# request_tries = 3
+#
+# Internal client config file path
+# internal_client_conf_path = /etc/swift/internal-client.conf
+#
+# You can set scheduling priority of processes. Niceness values range from -20
+# (most favorable to the process) to 19 (least favorable to the process).
+# nice_priority =
+#
+# You can set I/O scheduling class and priority of processes. I/O niceness
+# class values are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and
+# IOPRIO_CLASS_IDLE (idle). I/O niceness priority is a number which goes from
+# 0 to 7. The higher the value, the lower the I/O priority of the process.
+# Work only with ionice_class.
+# ionice_class =
+# ionice_priority =
+
+# Note: Put it at the beginning of the pipeline to profile all middleware. But
+# it is safer to put this after healthcheck. Not intended for production
+# environments!
+[filter:xprofile]
+use = egg:swift#xprofile
+# This option enables you to switch profilers; the profiler should inherit from
+# Python's standard profiler. Currently the supported values include 'cProfile',
+# 'eventlet.green.profile', etc.
+# profile_module = eventlet.green.profile
+#
+# This prefix will be used to combine process ID and timestamp to name the
+# profile data file.  Make sure the executing user has permission to write
+# into this path (missing path segments will be created, if necessary).
+# If you enable profiling in more than one type of daemon, you must override
+# it with a unique value like: /var/log/swift/profile/container.profile
+# log_filename_prefix = /tmp/log/swift/profile/default.profile
+#
+# The profile data will be dumped to local disk based on the above naming rule
+# at this interval.
+# dump_interval = 5.0
+#
+# Be careful: this option will enable the profiler to dump data into files with
+# timestamps, which means lots of files will pile up in the directory.
+# dump_timestamp = false
+#
+# This is the path of the URL to access the mini web UI.
+# path = /__profile__
+#
+# Clear the data when the wsgi server shuts down.
+# flush_at_shutdown = false
+#
+# unwind the iterator of applications
+# unwind = false
+
+[container-sharder]
+# You can override the default log routing for this app here (don't use set!):
+# log_name = container-sharder
+# log_facility = LOG_LOCAL0
+# log_level = INFO
+# log_address = /dev/log
+#
+# Container sharder specific settings
+#
+# If the auto_shard option is true then the sharder will automatically select
+# containers to shard, scan for shard ranges, and select shards to shrink.
+# The default is false.
+# Warning: auto-sharding is still under development and should not be used in
+# production; do not set this option to true in a production cluster.
+# auto_shard = false
+#
+# When auto-sharding is enabled shard_container_threshold defines the object
+# count at which a container with container-sharding enabled will start to
+# shard. shard_container_threshold also indirectly determines the defaults for
+# rows_per_shard, shrink_threshold and expansion_limit.
+# shard_container_threshold = 1000000
+#
+# rows_per_shard determines the initial nominal size of shard containers. The
+# default is shard_container_threshold // 2
+# rows_per_shard = 500000
+#
+# Minimum size of the final shard range. If this is greater than one then the
+# final shard range may be extended to more than rows_per_shard in order to
+# avoid a further shard range with less than minimum_shard_size rows. The
+# default value is rows_per_shard // 5.
+# minimum_shard_size = 100000
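+#
+# As a worked example of the defaults above: with
+# shard_container_threshold = 1000000, rows_per_shard defaults to 500000
+# (1000000 // 2) and minimum_shard_size defaults to 100000 (500000 // 5).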
+#
+# When auto-sharding is enabled shrink_threshold defines the object count
+# below which a 'donor' shard container will be considered for shrinking into
+# another 'acceptor' shard container. The default is determined by
+# shard_shrink_point. If set, shrink_threshold will take precedence over
+# shard_shrink_point.
+# shrink_threshold =
+#
+# When auto-sharding is enabled shard_shrink_point defines the object count
+# below which a 'donor' shard container will be considered for shrinking into
+# another 'acceptor' shard container. shard_shrink_point is a percentage of
+# shard_container_threshold e.g. the default value of 10 means 10% of the
+# shard_container_threshold.
+# Deprecated: shrink_threshold is recommended and if set will take precedence
+# over shard_shrink_point.
+# shard_shrink_point = 10
+#
+# When auto-sharding is enabled expansion_limit defines the maximum
+# allowed size of an acceptor shard container after having a donor merged into
+# it. The default is determined by shard_shrink_merge_point.
+# If set, expansion_limit will take precedence over shard_shrink_merge_point.
+# expansion_limit =
+#
+# When auto-sharding is enabled shard_shrink_merge_point defines the maximum
+# allowed size of an acceptor shard container after having a donor merged into
+# it. Shard_shrink_merge_point is a percentage of shard_container_threshold.
+# e.g. the default value of 75 means that the projected sum of a donor object
+# count and acceptor count must be less than 75% of shard_container_threshold
+# for the donor to be allowed to merge into the acceptor.
+#
+# For example, if the shard_container_threshold is 1 million,
+# shard_shrink_point is 10, and shard_shrink_merge_point is 75 then a shard will
+# be considered for shrinking if it has less than or equal to 100 thousand
+# objects but will only merge into an acceptor if the combined object count
+# would be less than or equal to 750 thousand objects.
+# Deprecated: expansion_limit is recommended and if set will take precedence
+# over shard_shrink_merge_point.
+# shard_shrink_merge_point = 75
+#
+# When auto-sharding is enabled shard_scanner_batch_size defines the maximum
+# number of shard ranges that will be found each time the sharder daemon visits
+# a sharding container. If necessary the sharder daemon will continue to search
+# for more shard ranges each time it visits the container.
+# shard_scanner_batch_size = 10
+#
+# cleave_batch_size defines the number of shard ranges that will be cleaved
+# each time the sharder daemon visits a sharding container.
+# cleave_batch_size = 2
+#
+# cleave_row_batch_size defines the size of batches of object rows read from a
+# sharding container and merged to a shard container during cleaving.
+# cleave_row_batch_size = 10000
+#
+# max_expanding defines the maximum number of shards that could be expanded in a
+# single cycle of the sharder. Defaults to unlimited (-1).
+# max_expanding = -1
+#
+# max_shrinking defines the maximum number of shards that should be shrunk into
+# each expanding shard. Defaults to 1.
+# NOTE: Using values greater than 1 may result in temporary gaps in object listings
+# until all selected shards have shrunk.
+# max_shrinking = 1
+#
+# Defines the number of successfully replicated shard dbs required when
+# cleaving a previously uncleaved shard range before the sharder will progress
+# to the next shard range. The value should be less than or equal to the
+# container ring replica count. The default of 'auto' causes the container ring
+# quorum value to be used. This option only applies to the container-sharder
+# replication and does not affect the number of shard container replicas that
+# will eventually be replicated by the container-replicator.
+# shard_replication_quorum = auto
+#
+# Defines the number of successfully replicated shard dbs required when
+# cleaving a shard range that has been previously cleaved on another node
+# before the sharder will progress to the next shard range. The value should be
+# less than or equal to the container ring replica count. The default of 'auto'
+# causes the shard_replication_quorum value to be used. This option only
+# applies to the container-sharder replication and does not affect the number
+# of shard container replicas that will eventually be replicated by the
+# container-replicator.
+# existing_shard_replication_quorum = auto
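+#
+# For example, with a typical 3-replica container ring (ring quorum of 2),
+# leaving both options at 'auto' means the sharder waits for 2 successful
+# shard db replications before moving on to the next shard range
+# (illustrative; the actual quorum depends on your ring's replica count).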
+#
+# The sharder uses an internal client to create and make requests to
+# containers. The absolute path to the client config file can be configured.
+# internal_client_conf_path = /etc/swift/internal-client.conf
+#
+# The number of times the internal client will retry requests.
+# request_tries = 3
+#
+# Each time the sharder dumps stats to the recon cache file it includes a list
+# of containers that appear to need sharding but are not yet sharding. By
+# default this list is limited to the top 5 containers, ordered by object
+# count. The limit may be changed by setting recon_candidates_limit to an
+# integer value. A negative value implies no limit.
+# recon_candidates_limit = 5
+#
+# As the sharder visits each container that's currently sharding it dumps to
+# recon their current progress. To be able to mark their progress as completed
+# this in-progress check will need to monitor containers that have just
+# completed sharding. The recon_sharded_timeout parameter controls how long a
+# container that has just finished sharding should be checked by the in-progress
+# check. This is to allow anything monitoring the sharding recon dump to have
+# enough time to collate and see things complete. The time is capped at
+# reclaim_age, so this parameter should be less than or equal to reclaim_age.
+# The default is 12 hours (12 x 60 x 60)
+# recon_sharded_timeout = 43200
+#
+# Maximum amount of time in seconds after sharding has been started on a shard
+# container before it is considered to have timed out. After this amount of
+# time, the sharder will warn that a container DB has not completed sharding.
+# The default is 48 hours (48 x 60 x 60)
+# container_sharding_timeout = 172800
+#
+# Some sharder states lead to repeated messages of 'Reclaimable db stuck
+# waiting for shrinking' on every sharder cycle. To reduce noise in logs,
+# this message will be suppressed for some time after its last emission.
+# Default is 24 hours.
+# periodic_warnings_interval = 86400
+#
+# Large databases tend to take a while to work with, but we want to make sure
+# we write down our progress. Use a larger-than-normal broker timeout to make
+# us less likely to bomb out on a LockTimeout.
+# broker_timeout = 60
+#
+# Time in seconds to wait between emitting stats to logs
+# stats_interval = 3600.0
+#
+# Time in seconds to wait between sharder cycles
+# interval = 30.0
+#
+# Process at most this many databases per second
+# databases_per_second = 50
+#
+# The container-sharder accepts the following configuration options as defined
+# in the container-replicator section:
+#
+# per_diff = 1000
+# max_diffs = 100
+# concurrency = 8
+# node_timeout = 10
+# conn_timeout = 0.5
+# reclaim_age = 604800
+# rsync_compress = no
+# rsync_module = {replication_ip}::container
+# recon_cache_path = /var/cache/swift
+#
diff --git a/etc/container-sync-realms.conf-sample b/etc/container-sync-realms.conf-sample
new file mode 100644
index 0000000000..01e4723ed5
--- /dev/null
+++ b/etc/container-sync-realms.conf-sample
@@ -0,0 +1,47 @@
+# [DEFAULT]
+# The number of seconds between checking the modified time of this config file
+# for changes and therefore reloading it.
+# mtime_check_interval = 300.0
+
+
+# [realm1]
+# key = realm1key
+# key2 = realm1key2
+# cluster_clustername1 = https://host1/v1/
+# cluster_clustername2 = https://host2/v1/
+#
+# [realm2]
+# key = realm2key
+# key2 = realm2key2
+# cluster_clustername3 = https://host3/v1/
+# cluster_clustername4 = https://host4/v1/
+
+
+# Each section name is the name of a sync realm. A sync realm is a set of
+# clusters that have agreed to allow container syncing with each other. Realm
+# names will be considered case insensitive.
+#
+# The key is the overall cluster-to-cluster key used in combination with the
+# external users' key that they set on their containers' X-Container-Sync-Key
+# metadata header values. These keys will be used to sign each request the
+# container sync daemon makes and used to validate each incoming container sync
+# request.
+#
+# The key2 is optional and is an additional key incoming requests will be
+# checked against. This is so you can rotate keys if you wish; you move the
+# existing key to key2 and make a new key value.
+#
+# Any values in the realm section whose names begin with cluster_ will indicate
+# the name and endpoint of a cluster and will be used by external users in
+# their containers' X-Container-Sync-To metadata header values with the format
+# "realm_name/cluster_name/container_name". Realm and cluster names are
+# considered case insensitive.
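+#
+# For example, using the illustrative [realm1] section above, an external
+# user could sync a container to clustername2 by setting on their source
+# container (values are hypothetical):
+#   X-Container-Sync-To: //realm1/clustername2/AUTH_account/container
+#   X-Container-Sync-Key: usersuppliedkey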
+#
+# The endpoint is what the container sync daemon will use when sending out
+# requests to that cluster. Keep in mind this endpoint must be reachable by all
+# container servers, since that is where the container sync daemon runs. Note
+# that the endpoint ends with /v1/ and that the container sync daemon will then
+# add the account/container/obj name after that.
+#
+# Distribute this container-sync-realms.conf file to all your proxy servers
+# and container servers.
diff --git a/etc/dispersion.conf-sample b/etc/dispersion.conf-sample
index d42cf35434..eae777a085 100644
--- a/etc/dispersion.conf-sample
+++ b/etc/dispersion.conf-sample
@@ -1,16 +1,41 @@
 [dispersion]
+# Please create a new account solely for using the dispersion tools; this
+# helps keep your own data clean.
 auth_url = http://localhost:8080/auth/v1.0
 auth_user = test:tester
 auth_key = testing
-# auth_url = http://saio:5000/v2.0/
-# auth_user = test:tester
-# auth_key = testing
+# auth_version = 1.0
+#
+# NOTE: If you want to use keystone (auth version 2.0), then its configuration
+# would look something like:
+# auth_url = http://localhost:5000/v2.0/
+# auth_user = tenant:user
+# auth_key = password
 # auth_version = 2.0
 #
+# NOTE: If you want to use keystone (auth version 3.0), then its configuration
+# would look something like:
+# auth_url = http://localhost:5000/v3/
+# auth_user = user
+# auth_key = password
+# auth_version = 3.0
+# project_name = project
+# project_domain_name = project_domain
+# user_domain_name = user_domain
+#
+# endpoint_type = publicURL
+#
+# NOTE: If you have only 1 region with a swift endpoint, no need to specify it
+# region_name =
+#
+# keystone_api_insecure = no
+#
 # swift_dir = /etc/swift
-# dispersion_coverage = 1
+# dispersion_coverage = 1.0
 # retries = 5
 # concurrency = 25
+# container_populate = yes
+# object_populate = yes
 # container_report = yes
 # object_report = yes
 # dump_json = no
diff --git a/etc/drive-audit.conf-sample b/etc/drive-audit.conf-sample
index 98ef4eb1be..69de6defbf 100644
--- a/etc/drive-audit.conf-sample
+++ b/etc/drive-audit.conf-sample
@@ -1,7 +1,42 @@
 [drive-audit]
+# Set owner of the drive-audit recon cache to this user:
+# user = swift
+#
 # device_dir = /srv/node
+#
+# You can specify default log routing here if you want:
+# log_name = drive-audit
 # log_facility = LOG_LOCAL0
 # log_level = INFO
 # log_address = /dev/log
+# The following caps the length of log lines to the value given; no limit if
+# set to 0, the default.
+# log_max_line_length = 0
+#
 # minutes = 60
 # error_limit = 1
+# recon_cache_path = /var/cache/swift
+# unmount_failed_device = True
+#
+# By default, drive-audit logs only to syslog. Setting this option True
+# makes drive-audit log to console in addition to syslog.
+# log_to_console = False
+#
+# Location of the log file with globbing
+# pattern to check against device errors.
+# log_file_pattern = /var/log/kern.*[!.][!g][!z]
+#
+# On Python 3, the encoding to use when reading the log file. Defaults
+# to the result of locale.getpreferredencoding(), like Python's open().
+# log_file_encoding = auto
+#
+# Regular expression patterns to be used to locate
+# device blocks with errors in the log file. Currently
+# the default ones are as follows:
+#   \berror\b.*\b(sd[a-z]{1,2}\d?)\b
+#   \b(sd[a-z]{1,2}\d?)\b.*\berror\b
+# One can override the default ones by providing
+# new expressions using the format below:
+# Format: regex_pattern_X = regex_expression
+# Example:
+#   regex_pattern_1 = \berror\b.*\b(dm-[0-9]{1,2}\d?)\b
diff --git a/etc/internal-client.conf-sample b/etc/internal-client.conf-sample
new file mode 100644
index 0000000000..cbeb401c03
--- /dev/null
+++ b/etc/internal-client.conf-sample
@@ -0,0 +1,51 @@
+[DEFAULT]
+# swift_dir = /etc/swift
+# user = swift
+# You can specify default log routing here if you want:
+# Note: the 'set' syntax is necessary to override the log_name that some
+# daemons specify when instantiating an internal client.
+# set log_name = swift
+# log_facility = LOG_LOCAL0
+# log_level = INFO
+# log_address = /dev/log
+#
+# comma separated list of functions to call to setup custom log handlers.
+# functions get passed: conf, name, log_to_console, log_route, fmt, logger,
+# adapted_logger
+# log_custom_handlers =
+#
+# If set, log_udp_host will override log_address
+# log_udp_host =
+# log_udp_port = 514
+#
+# You can enable StatsD logging here:
+# log_statsd_host =
+# log_statsd_port = 8125
+# log_statsd_default_sample_rate = 1.0
+# log_statsd_sample_rate_factor = 1.0
+# log_statsd_metric_prefix =
+
+[pipeline:main]
+# Note: gatekeeper middleware is not allowed in the internal client pipeline
+pipeline = catch_errors proxy-logging cache symlink proxy-server
+
+[app:proxy-server]
+use = egg:swift#proxy
+account_autocreate = true
+# See proxy-server.conf-sample for options
+
+[filter:symlink]
+use = egg:swift#symlink
+# See proxy-server.conf-sample for options
+
+[filter:cache]
+use = egg:swift#memcache
+# See proxy-server.conf-sample for options
+
+[filter:proxy-logging]
+use = egg:swift#proxy_logging
+# See proxy-server.conf-sample for options
+
+[filter:catch_errors]
+use = egg:swift#catch_errors
+# See proxy-server.conf-sample for options
diff --git a/etc/keymaster.conf-sample b/etc/keymaster.conf-sample
new file mode 100644
index 0000000000..7881676e1a
--- /dev/null
+++ b/etc/keymaster.conf-sample
@@ -0,0 +1,131 @@
+[keymaster]
+# Over time, the format of crypto metadata on disk may change slightly to resolve
+# ambiguities. In general, you want to be writing the newest version, but to
+# ensure that all writes can still be read during rolling upgrades, there's the
+# option to write older formats as well.
+# Before upgrading from Swift 2.20.0 or earlier, ensure this is set to 1
+# Before upgrading from Swift 2.25.0 or earlier, ensure this is set to at most 2
+# After upgrading all proxy servers, set this to 3 (currently the highest version)
+# meta_version_to_write = 3
+
+# Sets the root secret from which encryption keys are derived. This must be set
+# before first use to a value that is a base64 encoding of at least 32 bytes.
+# The security of all encrypted data critically depends on this key, therefore
+# it should be set to a high-entropy value. For example, a suitable value may
+# be obtained by base-64 encoding a 32 byte (or longer) value generated by a
+# cryptographically secure random number generator. Changing the root secret is
+# likely to result in data loss. If this option is set, the root secret MUST
+# NOT be set in proxy-server.conf.
+# encryption_root_secret = changeme
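+#
+# For example (one possible way to generate a suitable value; any
+# cryptographically secure source of 32 or more random bytes, base64
+# encoded, will do):
+#   openssl rand -base64 32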
+
+[kms_keymaster]
+# The kms_keymaster section is used for configuring a keymaster that retrieves
+# the encryption root secret from an external key management system (kms),
+# using the Castellan abstraction layer. Castellan can support various kms
+# backends that use Keystone for authentication. Currently, the only
+# implemented backend is for Barbican.
+
+# Over time, the format of crypto metadata on disk may change slightly to resolve
+# ambiguities. In general, you want to be writing the newest version, but to
+# ensure that all writes can still be read during rolling upgrades, there's the
+# option to write older formats as well.
+# Before upgrading from Swift 2.20.0 or earlier, ensure this is set to 1
+# Before upgrading from Swift 2.25.0 or earlier, ensure this is set to at most 2
+# After upgrading all proxy servers, set this to 3 (currently the highest version)
+# meta_version_to_write = 3
+
+# The api_class tells Castellan which key manager to use to access the external
+# key management system. The default value that accesses Barbican is
+# castellan.key_manager.barbican_key_manager.BarbicanKeyManager.
+# api_class = castellan.key_manager.barbican_key_manager.BarbicanKeyManager
+
+# The configuration options below apply to a Barbican KMS being accessed using
+# Castellan. If another KMS type is used (by specifying another value for
+# api_class), then other configuration options may be required.
+
+# The key_id is the identifier of the root secret stored in the KMS. For
+# details of how to store an existing root secret in Barbican, or how to
+# generate a new root secret in Barbican, see the 'overview_encryption'
+# documentation.
+# The key_id is the final part of the secret href returned in the
+# output of an 'openstack secret order get' command after an order to store or
+# create a key has been successfully completed. See the 'overview_encryption'
+# documentation for more information on this command.
+# key_id = changeme
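+#
+# For illustration only: if the secret href returned by
+# 'openstack secret order get' ended in
+# /v1/secrets/a3395887-1e02-4d8a-9fbc-3b4c5e4d8a21 (a made-up id), then
+# key_id would be set to a3395887-1e02-4d8a-9fbc-3b4c5e4d8a21.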
+
+# The Keystone username of the user used to access the key from the KMS. The
+# username shall be set to match an existing user.
+# username = changeme
+
+# The password to go with the Keystone username above.
+# password = changeme
+
+# The Keystone project name. For security reasons, it is recommended to set
+# the project_name to a project separate from the service project used by
+# other OpenStack services. That way, if another service is compromised, it will
+# not have access to the Swift root encryption secret. It is recommended that
+# the swift user is the only one that has a role in this project.
+# project_name = changeme
+# Instead of the project name, the project id may also be used.
+# project_id = changeme
+
+# The Keystone URL to authenticate to. The value of auth_endpoint may be
+# set according to the value of www_authenticate_uri in [filter:authtoken] in
+# proxy-server.conf.
+# auth_endpoint = http://keystonehost/identity
+
+# The project and user domain names may optionally be specified. If they are
+# not specified, the default values of 'Default' (for *_domain_name) and
+# 'default' (for *_domain_id) are used (note the capitalization).
+# project_domain_name = Default
+# user_domain_name = Default
+# Instead of the project domain name and user domain name, the project domain
+# id and user domain id may also be specified.
+# project_domain_id = default
+# user_domain_id = default
+
+# The following configuration options may also be used in addition to/instead
+# of the above options. Refer to the Keystone documentation for more details
+# on the usage of the options: https://docs.openstack.org/keystone/
+# user_id = changeme
+# trust_id = changeme
+# reauthenticate = changeme
+# domain_id = changeme
+# domain_name = changeme
+
+# If running on a multi-region cluster, Castellan may select the wrong
+# endpoint for Barbican. To avoid this, configure the region name for the
+# correct barbican endpoint, or specify the barbican endpoint explicitly.
+# If there is only a single Barbican service in your deployment, it is
+# fine to leave these unconfigured.
+# barbican_region_name =
+# barbican_endpoint =
+
+[kmip_keymaster]
+# The kmip_keymaster section is used to configure a keymaster that fetches an
+# encryption root secret from a KMIP service.
+
+# Over time, the format of crypto metadata on disk may change slightly to resolve
+# ambiguities. In general, you want to be writing the newest version, but to
+# ensure that all writes can still be read during rolling upgrades, there's the
+# option to write older formats as well.
+# Before upgrading from Swift 2.20.0 or earlier, ensure this is set to 1
+# Before upgrading from Swift 2.25.0 or earlier, ensure this is set to at most 2
+# After upgrading all proxy servers, set this to 3 (currently the highest version)
+# meta_version_to_write = 3
+
+# The value of the ``key_id`` option should be the unique identifier for a
+# secret that will be retrieved from the KMIP service. The secret should be an
+# AES-256 symmetric key.
+# key_id = 
+
+# The remaining options are used to configure a PyKMIP client and are shown
+# below for information. The authoritative definition of these options can be
+# found at: https://pykmip.readthedocs.io/en/latest/client.html.
+# host = 
+# port = 
+# certfile = /path/to/client/cert.pem
+# keyfile = /path/to/client/key.pem
+# ca_certs = /path/to/server/cert.pem
+# username = 
+# password = 
diff --git a/etc/magic b/etc/magic
new file mode 100644
index 0000000000..0bd2a65064
--- /dev/null
+++ b/etc/magic
@@ -0,0 +1,20 @@
+#-------------------------------------------------------------------------------
+# Openstack swift
+# Note: add this snippet to either /etc/magic or ~/.magic
+#-------------------------------------------------------------------------------
+# gzip compressed
+0 beshort 0x1f8b
+# compress method: deflate, flags: FNAME
+>&0 beshort 0x0808
+# skip ahead another 6 (MTIME, XFL, OS); read FNAME
+>>&6 search/0x40 \0
+# Skip ahead five; should cover
+#   00    -- uncompressed block
+#   06 00 -- ... of length 6
+#   f9 ff -- (one's complement of length)
+>>>&5 string/4 R1NG     Swift ring,
+>>>>&0 clear x
+>>>>&0 beshort 1        version 1
+>>>>&0 beshort 2        version 2
+>>>>&0 default x
+>>>>>&0 beshort x       unknown version (0x%04x)
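+#
+# Example usage (illustrative): after adding this snippet to ~/.magic,
+# something like
+#   file /etc/swift/object.ring.gz
+# should include "Swift ring, version 1" (or version 2) in its description.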
diff --git a/etc/memcache.conf-sample b/etc/memcache.conf-sample
index 5ad48ab100..f85e49edc6 100644
--- a/etc/memcache.conf-sample
+++ b/etc/memcache.conf-sample
@@ -2,14 +2,53 @@
 # You can use this single conf file instead of having memcache_servers set in
 # several other conf files under [filter:cache] for example. You can specify
 # multiple servers separated with commas, as in: 10.1.2.3:11211,10.1.2.4:11211
+# (IPv6 addresses must follow rfc3986 section-3.2.2, i.e. [::1]:11211)
 # memcache_servers = 127.0.0.1:11211
 #
-# Sets how memcache values are serialized and deserialized:
-# 0 = older, insecure pickle serialization
-# 1 = json serialization but pickles can still be read (still insecure)
-# 2 = json serialization only (secure and the default)
-# To avoid an instant full cache flush, existing installations should
-# upgrade with 0, then set to 1 and reload, then after some time (24 hours)
-# set to 2 and reload.
-# In the future, the ability to use pickle serialization will be removed.
-# memcache_serialization_support = 2
+# Sets the maximum number of connections to each memcached server per worker
+# memcache_max_connections = 2
+#
+# Timeout for connection
+# connect_timeout = 0.3
+# Timeout for pooled connection
+# pool_timeout = 1.0
+# number of servers to retry on failures getting a pooled connection
+# tries = 3
+# Timeout for read and writes
+# io_timeout = 2.0
+#
+# How long without an error before a server's error count is reset. This will
+# also be how long before a server is reenabled after suppression is triggered.
+# Set to 0 to disable error-limiting.
+# error_suppression_interval = 60.0
+#
+# How many errors can accumulate before a server is temporarily ignored.
+# error_suppression_limit = 10
+#
+# (Optional) Global toggle for TLS usage when communicating with
+# the caching servers.
+# tls_enabled = false
+#
+# (Optional) Path to a file of concatenated CA certificates in PEM
+# format necessary to establish the caching server's authenticity.
+# If tls_enabled is False, this option is ignored.
+# tls_cafile =
+#
+# (Optional) Path to a single file in PEM format containing the
+# client's certificate as well as any number of CA certificates
+# needed to establish the certificate's authenticity. This file
+# is only required when client side authentication is necessary.
+# If tls_enabled is False, this option is ignored.
+# tls_certfile =
+#
+# (Optional) Path to a single file containing the client's private
+# key. Otherwise the private key will be taken from the file
+# specified in tls_certfile. If tls_enabled is False, this option
+# is ignored.
+# tls_keyfile =
+#
+# If an item size ever gets above item_size_warning_threshold then a warning will be
+# logged. This can be used to alert when memcache item sizes are getting to their limit.
+# It's an absolute size in bytes. Setting the value to 0 will warn on every memcache set.
+# A value of -1 disables the warning.
+# item_size_warning_threshold = -1
diff --git a/etc/object-expirer.conf-sample b/etc/object-expirer.conf-sample
index cef0f0f19d..109c0b5093 100644
--- a/etc/object-expirer.conf-sample
+++ b/etc/object-expirer.conf-sample
@@ -6,26 +6,118 @@
 # log_facility = LOG_LOCAL0
 # log_level = INFO
 # log_address = /dev/log
+# The following caps the length of log lines to the value given; no limit if
+# set to 0, the default.
+# log_max_line_length = 0
+#
 # comma separated list of functions to call to setup custom log handlers.
 # functions get passed: conf, name, log_to_console, log_route, fmt, logger,
 # adapted_logger
 # log_custom_handlers =
+#
 # If set, log_udp_host will override log_address
 # log_udp_host =
 # log_udp_port = 514
+#
 # You can enable StatsD logging here:
-# log_statsd_host = localhost
+# log_statsd_host =
 # log_statsd_port = 8125
-# log_statsd_default_sample_rate = 1
+# log_statsd_default_sample_rate = 1.0
+# log_statsd_sample_rate_factor = 1.0
 # log_statsd_metric_prefix =
+#
+# You can set scheduling priority of processes. Niceness values range from -20
+# (most favorable to the process) to 19 (least favorable to the process).
+# nice_priority =
+#
+# You can set I/O scheduling class and priority of processes. I/O niceness
+# class values are realtime, best-effort and idle. I/O niceness
+# priority is a number which goes from 0 to 7. The higher the value, the lower
+# the I/O priority of the process. Work only with ionice_class.
+# ionice_class =
+# ionice_priority =
 
 [object-expirer]
-# interval = 300
-# auto_create_account_prefix = .
-# report_interval = 300
+# interval = 300.0
+# report_interval = 300.0
+#
+# request_tries is the number of times the expirer's internal client will
+# attempt any given request in the event of failure. The default is 3.
+# request_tries = 3
+
+# concurrency is the level of concurrency to use to do the work; this value
+# must be set to at least 1
+# concurrency = 1
+#
+# deletes can be ratelimited to prevent the expirer from overwhelming the cluster
+# tasks_per_second = 50.0
+#
+# processes is how many parts to divide the work into, one part per process
+# that will be doing the work
+# Setting processes to 0 means that a single process will do all the work
+# processes can also be specified on the command line and will override the
+# config value
+# processes = 0
+#
+# process is which of the parts a particular process will work on
+# process can also be specified on the command line and will override the config
+# value
+# process is "zero based", if you want to use 3 processes, you should run
+# processes with process set to 0, 1, and 2
+# process = 0
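+#
+# For example, to divide the work among three expirer daemons (illustrative
+# values), run each daemon with:
+#   processes = 3
+#   process = 0    # and 1 and 2, respectively, on the other two daemons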
+#
+# The expirer will re-attempt expiring if the source object is not available
+# up to reclaim_age seconds before it gives up and deletes the entry in the
+# queue.
+# reclaim_age = 604800
+#
+# The expirer can delay the reaping of expired objects on disk (and in
+# container listings) with an account level or container level delay_reaping
+# time.
+# After the delay_reaping time has passed objects will be reaped as normal.
+# You may configure this delay_reaping value in seconds with dynamic config
+# option names prefixed with delay_reaping_<ACCT> for account level delays
+# and delay_reaping_<ACCT>/<CNTR> for container level delays.
+# Special characters in <ACCT> or <CNTR> should be quoted.
+# The delay_reaping value should be a float value greater than or equal to
+# zero.
+# A container level delay_reaping does not require an account level
+# delay_reaping but overrides the account level delay_reaping for the same
+# account if it exists.
+# For example:
+# delay_reaping_AUTH_test = 300.0
+# delay_reaping_AUTH_test2 = 86400.0
+# delay_reaping_AUTH_test/test = 400.0
+# delay_reaping_AUTH_test/test2 = 600.0
+# delay_reaping_AUTH_test/special%0Achars%3Dshould%20be%20quoted
+# N.B. By default no delay_reaping value is configured for any accounts or
+# containers.
+
+# Number of task objects to cache before processing.  With many nodes it may
+# take some time to fill a larger cache_size but may also have a better chance
+# to distribute DELETEs to multiple target containers.
+# round_robin_task_cache_size = 100000
+
+# recon_cache_path = /var/cache/swift
+#
+# You can set scheduling priority of processes. Niceness values range from -20
+# (most favorable to the process) to 19 (least favorable to the process).
+# nice_priority =
+#
+# You can set I/O scheduling class and priority of processes. I/O niceness
+# class values are realtime, best-effort and idle. I/O niceness
+# priority is a number which goes from 0 to 7. The higher the value, the lower
+# the I/O priority of the process. Work only with ionice_class.
+# ionice_class =
+# ionice_priority =
+
+#
+# The following sections define the configuration of the expirer's internal
+# client pipeline
+#
 
 [pipeline:main]
-pipeline = catch_errors cache proxy-server
+pipeline = catch_errors proxy-logging cache proxy-server
 
 [app:proxy-server]
 use = egg:swift#proxy
@@ -38,3 +130,7 @@ use = egg:swift#memcache
 [filter:catch_errors]
 use = egg:swift#catch_errors
 # See proxy-server.conf-sample for options
+
+[filter:proxy-logging]
+use = egg:swift#proxy_logging
+# See proxy-server.conf-sample for options
diff --git a/etc/object-server.conf-sample b/etc/object-server.conf-sample
index 2e8b54f4eb..dd6bc21866 100644
--- a/etc/object-server.conf-sample
+++ b/etc/object-server.conf-sample
@@ -1,36 +1,121 @@
 [DEFAULT]
 # bind_ip = 0.0.0.0
-# bind_port = 6000
+bind_port = 6200
+# keep_idle = 600
 # bind_timeout = 30
 # backlog = 4096
-# workers = 1
 # user = swift
 # swift_dir = /etc/swift
 # devices = /srv/node
 # mount_check = true
 # disable_fallocate = false
-# expiring_objects_container_divisor = 86400
+#
+# Use an integer to override the number of pre-forked processes that will
+# accept connections.  NOTE: if servers_per_port is set, this setting is
+# ignored.
+# workers = auto
+#
+# Make object-server run this many worker processes per unique port of "local"
+# ring devices across all storage policies. The default value of 0 disables this
+# feature.
+# servers_per_port = 0
+#
+# If running in a container, servers_per_port may not be able to use the
+# bind_ip to lookup the ports in the ring.  You may instead override the port
+# lookup in the ring using the ring_ip.  Any devices/ports associated with the
+# ring_ip will be used when listening on the configured bind_ip address.
+# ring_ip = 
+#
+# Maximum concurrent requests per worker
+# max_clients = 1024
+#
 # You can specify default log routing here if you want:
 # log_name = swift
 # log_facility = LOG_LOCAL0
 # log_level = INFO
 # log_address = /dev/log
+# The following caps the length of log lines to the value given; no limit if
+# set to 0, the default.
+# log_max_line_length = 0
+#
+# Hashing algorithm for log anonymization. Must be one of algorithms supported
+# by Python's hashlib.
+# log_anonymization_method = MD5
+#
+# Salt added during log anonymization
+# log_anonymization_salt =
+#
+# Template used to format logs. All words surrounded by curly brackets
+# will be substituted with the appropriate values
+# log_format = {remote_addr} - - [{time.d}/{time.b}/{time.Y}:{time.H}:{time.M}:{time.S} +0000] "{method} {path}" {status} {content_length} "{referer}" "{txn_id}" "{user_agent}" {trans_time:.4f} "{additional_info}" {pid} {policy_index}
+#
 # comma separated list of functions to call to setup custom log handlers.
 # functions get passed: conf, name, log_to_console, log_route, fmt, logger,
 # adapted_logger
 # log_custom_handlers =
+#
 # If set, log_udp_host will override log_address
 # log_udp_host =
 # log_udp_port = 514
+#
 # You can enable StatsD logging here:
-# log_statsd_host = localhost
+# log_statsd_host =
 # log_statsd_port = 8125
-# log_statsd_default_sample_rate = 1
+# log_statsd_default_sample_rate = 1.0
+# log_statsd_sample_rate_factor = 1.0
 # log_statsd_metric_prefix =
+#
 # eventlet_debug = false
+#
+# You can set fallocate_reserve to the number of bytes or percentage of disk
+# space you'd like fallocate to reserve, whether there is space for the given
+# file size or not. Percentage will be used if the value ends with a '%'.
+# fallocate_reserve = 1%
+#
+# Time to wait while attempting to connect to another backend node.
+# conn_timeout = 0.5
+# Time to wait while sending each chunk of data to another backend node.
+# node_timeout = 3
+# Time to wait while sending a container update on object update.
+# container_update_timeout = 1.0
+# Time to wait while receiving each chunk of data from a client or another
+# backend node.
+# client_timeout = 60.0
+#
+# network_chunk_size = 65536
+# disk_chunk_size = 65536
+#
+# Reclamation of tombstone files is performed primarily by the replicator and
+# the reconstructor but the object-server and object-auditor also reference
+# this value - it should be the same for all object services in the cluster,
+# and not greater than the container services reclaim_age
+# reclaim_age = 604800
+#
+# Non-durable data files may also get reclaimed if they are older than
+# reclaim_age, but not if the time they were written to disk (i.e. mtime) is
+# less than commit_window seconds ago. The commit_window also prevents the
+# reconstructor removing recently written non-durable data files from a handoff
+# node after reverting them to a primary. This gives the object-server a window
+# in which to finish a concurrent PUT on a handoff and mark the data durable. A
+# commit_window greater than zero is strongly recommended to avoid unintended
+# removal of data files that were about to become durable; commit_window should
+# be much less than reclaim_age.
+# commit_window = 60.0
+#
+# You can set scheduling priority of processes. Niceness values range from -20
+# (most favorable to the process) to 19 (least favorable to the process).
+# nice_priority =
+#
+# You can set I/O scheduling class and priority of processes. I/O niceness
+# class values are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and
+# IOPRIO_CLASS_IDLE (idle). I/O niceness priority is a number which goes from
+# 0 to 7. The higher the value, the lower the I/O priority of the process.
+# Work only with ionice_class.
+# ionice_class =
+# ionice_priority =
 
 [pipeline:main]
-pipeline = healthcheck recon object-server
+pipeline = healthcheck recon backend_ratelimit object-server
 
 [app:object-server]
 use = egg:swift#object
@@ -38,26 +123,132 @@ use = egg:swift#object
 # set log_name = object-server
 # set log_facility = LOG_LOCAL0
 # set log_level = INFO
-# set log_requests = True
+# set log_requests = true
 # set log_address = /dev/log
-# node_timeout = 3
-# conn_timeout = 0.5
-# network_chunk_size = 65536
-# disk_chunk_size = 65536
+#
 # max_upload_time = 86400
+#
+# slow is the minimum total number of seconds an object PUT/DELETE request
+# will take. If the request finishes faster, the object server sleeps for this
+# amount of time minus the transaction time that has already passed.  This is
+# only useful for simulating slow devices on storage nodes during testing and
+# development.
 # slow = 0
+#
 # Objects smaller than this are not evicted from the buffercache once read
-# keep_cache_size = 5424880
+# keep_cache_size = 5242880
+#
 # If true, objects for authenticated GET requests may be kept in buffer cache
 # if small enough
-# keep_cache_private = False
+# keep_cache_private = false
+#
+# If true, an SLO object's manifest file may be kept in buffer cache for GET
+# requests if it is smaller than 'keep_cache_size'. This config only matters
+# when 'keep_cache_private' is false.
+# keep_cache_slo_manifest = false
+#
+# cooperative_period defines how frequently object server GET/PUT requests
+# will perform cooperative yielding while iterating over disk chunks. For
+# example, a value of '5' will insert one sleep() after every 5 disk_chunk_size
+# chunk reads/writes. A value of '0' (the default) will turn off cooperative
+# yielding.
+# cooperative_period = 0
+#
+# By default, the object-server will always validate the MD5 of object data
+# while streaming a complete object response. Occasionally this is identified
+# as a CPU bottleneck, consuming as much as 40% of the CPU time of the
+# object-server. Since range-request-heavy clients don't get these integrity
+# checks, it seems reasonable to give operators a chance to tune it down and
+# instead rely on the object-auditor to detect and quarantine corrupted objects.
+# etag_validate_pct = 100
+#
 # on PUTs, sync data every n MB
 # mb_per_sync = 512
+#
 # Comma separated list of headers that can be set in metadata on an object.
 # This list is in addition to X-Object-Meta-* headers and cannot include
 # Content-Type, etag, Content-Length, or deleted
-# allowed_headers = Content-Disposition, Content-Encoding, X-Delete-At, X-Object-Manifest
-# auto_create_account_prefix = .
+# allowed_headers = Content-Disposition, Content-Encoding, X-Delete-At, X-Object-Manifest, X-Static-Large-Object, Cache-Control, Content-Language, Expires, X-Robots-Tag
+
+# The number of threads in eventlet's thread pool. Most IO will occur
+# in the object server's main thread, but certain "heavy" IO
+# operations will occur in separate IO threads, managed by eventlet.
+#
+# The default value is auto, whose actual value is dependent on the
+# servers_per_port value:
+#
+#  - When servers_per_port is zero, the default value of
+#    eventlet_tpool_num_threads is empty, which uses eventlet's default
+#    (currently 20 threads).
+#
+#  - When servers_per_port is nonzero, the default value of
+#    eventlet_tpool_num_threads is 1.
+#
+# But you may override this value to any integer value.
+#
+# Note that this value is threads per object-server process, so to
+# compute the total number of IO threads on a node, you must multiply
+# this by the number of object-server processes on the node.
+#
+# eventlet_tpool_num_threads = auto
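+#
+# As a worked example: a node running 4 object-server processes with
+# eventlet_tpool_num_threads = 2 would have up to 4 * 2 = 8 of these IO
+# threads in total (illustrative numbers).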
+
+# You can disable REPLICATE and SSYNC handling (default is to allow it). When
+# deploying a cluster with a separate replication network, you'll want multiple
+# object-server processes running: one for client-driven traffic and another
+# for replication traffic. The server handling client-driven traffic may set
+# this to false. If there is only one object-server process, leave this as
+# true.
+# replication_server = true
+#
+# Set to restrict the number of concurrent incoming SSYNC requests
+# Set to 0 for unlimited
+# Note that SSYNC requests are only used by the object reconstructor or the
+# object replicator when configured to use ssync.
+# replication_concurrency = 4
+#
+# Set to restrict the number of concurrent incoming SSYNC requests per
+# device; set to 0 for unlimited requests per device. This can help control
+# I/O to each device. This does not override replication_concurrency described
+# above, so you may need to adjust both parameters depending on your hardware
+# or network capacity.
+# replication_concurrency_per_device = 1
+#
+# Number of seconds to wait for an existing replication device lock before
+# giving up.
+# replication_lock_timeout = 15
+#
+# These next two settings control when the SSYNC subrequest handler will
+# abort an incoming SSYNC attempt. An abort will occur if there are at
+# least threshold number of failures and the value of failures / successes
+# exceeds the ratio. The defaults of 100 and 1.0 mean that at least 100
+# failures have to occur and there have to be more failures than successes for
+# an abort to occur.
+# replication_failure_threshold = 100
+# replication_failure_ratio = 1.0
+#
+# Use splice() for zero-copy object GETs. This requires Linux kernel
+# version 3.0 or greater. If you set "splice = yes" but the kernel
+# does not support it, error messages will appear in the object server
+# logs at startup, but your object servers should continue to function.
+#
+# splice = no
+#
+# You can set scheduling priority of processes. Niceness values range from -20
+# (most favorable to the process) to 19 (least favorable to the process).
+# nice_priority =
+#
+# You can set I/O scheduling class and priority of processes. I/O niceness
+# class values are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and
+# IOPRIO_CLASS_IDLE (idle). I/O niceness priority is a number which goes from
+# 0 to 7. The higher the value, the lower the I/O priority of the process.
+# Work only with ionice_class.
+# ionice_class =
+# ionice_priority =
+#
+# When reloading servers with SIGUSR1, workers running with old config/code
+# are allowed some time to finish serving in-flight requests. Use this to
+# configure the grace period (in seconds), after which the reloaded server
+# will issue SIGKILLs to remaining stale workers.
+# stale_worker_timeout = 86400
 
 [filter:healthcheck]
 use = egg:swift#healthcheck
@@ -70,43 +261,315 @@ use = egg:swift#recon
 #recon_cache_path = /var/cache/swift
 #recon_lock_path = /var/lock
 
+[filter:backend_ratelimit]
+use = egg:swift#backend_ratelimit
+# Config options can optionally be loaded from a separate config file. Config
+# options in this section will be used unless the same option is found in the
+# config file, in which case the config file option will be used. See the
+# backend-ratelimit.conf-sample file for details of available config options.
+# backend_ratelimit_conf_path = /etc/swift/backend-ratelimit.conf
+
+# The minimum interval between attempts to reload any config file at
+# backend_ratelimit_conf_path while the server is running. A value of 0 means
+# that the file is loaded at start-up but not subsequently reloaded. Note that
+# config options in this section are never reloaded after start-up.
+# config_reload_interval = 60
+
 [object-replicator]
 # You can override the default log routing for this app here (don't use set!):
 # log_name = object-replicator
 # log_facility = LOG_LOCAL0
 # log_level = INFO
 # log_address = /dev/log
-# vm_test_mode = no
+#
 # daemonize = on
-# run_pause = 30
+#
+# Time in seconds to wait between replication passes
+# interval = 30.0
+# run_pause is deprecated, use interval instead
+# run_pause = 30.0
+#
+# Number of concurrent replication jobs to run. This is per-process,
+# so replicator_workers=W and concurrency=C will result in W*C
+# replication jobs running at once.
 # concurrency = 1
-# stats_interval = 300
+#
+# Number of worker processes to use. No matter how big this number is,
+# at most one worker per disk will be used. 0 means no forking; all work
+# is done in the main process.
+# replicator_workers = 0
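+#
+# For example (illustrative values): replicator_workers = 2 with
+# concurrency = 4 allows up to 2 * 4 = 8 replication jobs at once.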
+#
+# stats_interval = 300.0
+#
+# default is rsync, alternative is ssync
+# sync_method = rsync
+#
 # max duration of a partition rsync
 # rsync_timeout = 900
-# passed to rsync for io op timeout
+#
+# bandwidth limit for rsync in kB/s. 0 means unlimited. rsync 3.2.2 and later
+# accept suffixed values like 10M or 1.5G; see the --bwlimit option for rsync(1)
+# rsync_bwlimit = 0
+#
+# passed to rsync for both io op timeout and connection timeout
 # rsync_io_timeout = 30
-# max duration of an http request
+#
+# Allow rsync to compress data which is transmitted to destination node
+# during sync. However, this is applicable only when destination node is in
+# a different region than the local one.
+# NOTE: Objects that are already compressed (for example: .tar.gz, .mp3) might
+# slow down the syncing process.
+# rsync_compress = no
+#
+# Format of the rsync module where the replicator will send data. See
+# etc/rsyncd.conf-sample for some usage examples.
+# rsync_module = {replication_ip}::object
+#
+# node_timeout = 
+# max duration of an http request; this is for REPLICATE finalization calls and
+# so should be longer than node_timeout
 # http_timeout = 60
+#
 # attempts to kill all workers if nothing replicates for lockup_timeout seconds
 # lockup_timeout = 1800
-# The replicator also performs reclamation
-# reclaim_age = 604800
-# ring_check_interval = 15
+#
+# ring_check_interval = 15.0
 # recon_cache_path = /var/cache/swift
+#
+# By default, per-file rsync transfers are logged at debug if successful and
+# error on failure. During large rebalances (which both increase the number
+# of diskfiles transferred and increases the likelihood of failures), this
+# can overwhelm log aggregation while providing little useful insights.
+# Change this to false to disable per-file logging.
+# log_rsync_transfers = true
+#
+# limits how long rsync error log lines are
+# 0 means to log the entire line
+# rsync_error_log_line_length = 0
+#
+# handoffs_first and handoff_delete are options for special cases
+# such as full disks in the cluster. These two options SHOULD NOT BE
+# CHANGED, except in such extreme situations (e.g. disks filled up
+# or about to fill up. Anyway, DO NOT let your drives fill up).
+# handoffs_first is the flag to replicate handoffs prior to canonical
+# partitions. It allows forcing the syncing and deleting of handoffs quickly.
+# If set to a True value (e.g. "True" or "1"), partitions
+# that are not supposed to be on the node will be replicated first.
+# handoffs_first = False
+#
+# handoff_delete is the number of replicas which are ensured in swift.
+# If a number less than the number of replicas is set, the object-replicator
+# may delete local handoffs even though not all replicas are ensured in the
+# cluster: the object-replicator will remove local handoff partition directories
+# after syncing a partition when the number of successful responses is greater
+# than or equal to this number. By default (auto), handoff partitions will only
+# be removed once they have successfully replicated to all the canonical nodes.
+# handoff_delete = auto
+#
+# You can set scheduling priority of processes. Niceness values range from -20
+# (most favorable to the process) to 19 (least favorable to the process).
+# nice_priority =
+#
+# You can set I/O scheduling class and priority of processes. I/O niceness
+# class values are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and
+# IOPRIO_CLASS_IDLE (idle). I/O niceness priority is a number which goes from
+# 0 to 7. The higher the value, the lower the I/O priority of the process.
+# Work only with ionice_class.
+# ionice_class =
+# ionice_priority =
 
-[object-updater]
+[object-reconstructor]
 # You can override the default log routing for this app here (don't use set!):
-# log_name = object-updater
+# Unless otherwise noted, each setting below has the same meaning as described
+# in the [object-replicator] section, however these settings apply to the EC
+# reconstructor
+#
+# log_name = object-reconstructor
 # log_facility = LOG_LOCAL0
 # log_level = INFO
 # log_address = /dev/log
-# interval = 300
+#
+# daemonize = on
+#
+# Time in seconds to wait between reconstruction passes
+# interval = 30.0
+# run_pause is deprecated, use interval instead
+# run_pause = 30.0
+#
+# Maximum number of worker processes to spawn.  Each worker will handle a
+# subset of devices.  Devices will be assigned evenly among the workers so that
+# workers cycle at similar intervals (which can lead to fewer workers than
+# requested).  You cannot have more workers than devices.  If you have no
+# devices only a single worker is spawned.
+# reconstructor_workers = 0
+#
 # concurrency = 1
+# stats_interval = 300.0
 # node_timeout = 10
-# conn_timeout = 0.5
-# slowdown will sleep that amount between objects
+# http_timeout = 60
+# lockup_timeout = 1800
+# ring_check_interval = 15.0
+# recon_cache_path = /var/cache/swift
+#
+# The handoffs_only mode option is for special case emergency situations during
+# rebalance such as disk full in the cluster.  This option SHOULD NOT BE
+# CHANGED, except for extreme situations.  When handoffs_only mode is enabled
+# the reconstructor will *only* revert fragments from handoff nodes to primary
+# nodes and will not sync primary nodes with neighboring primary nodes.  This
+# will force the reconstructor to sync and delete handoffs' fragments more
+# quickly and minimize the time of the rebalance by limiting the number of
+# rebuilds.  The handoffs_only option is only for temporary use and should be
+# disabled as soon as the emergency situation has been resolved.  When
+# handoffs_only is not set, the deprecated handoffs_first option will be
+# honored as a synonym, but may be ignored in a future release.
+# handoffs_only = False
+#
+# The default strategy for unmounted drives will stage rebuilt data on a
+# handoff node until updated rings are deployed.  Because fragments are rebuilt
+# on offset handoffs based on fragment index and the proxy limits how deep it
+# will search for EC frags, we restrict how many nodes we'll try.  Setting to 0
+# will disable rebuilds to handoffs and only rebuild fragments for unmounted
+# devices to mounted primaries after a ring change.
+# Setting to -1 means "no limit".
+# rebuild_handoff_node_count = 2
+#
+# By default the reconstructor attempts to revert all objects from handoff
+# partitions in a single batch using a single SSYNC request. In exceptional
+# circumstances max_objects_per_revert can be used to temporarily limit the
+# number of objects reverted by each reconstructor revert type job. If more
+# than max_objects_per_revert are available in a sender's handoff partition,
+# the remaining objects will remain in the handoff partition and will not be
+# reverted until the next time the reconstructor visits that handoff partition
+# i.e. with this option set, a single cycle of the reconstructor may not
+# completely revert all handoff partitions. The option has no effect on
+# reconstructor sync type jobs between primary partitions. A value of 0 (the
+# default) means there is no limit.
+# max_objects_per_revert = 0
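+#
+# For example (a hypothetical temporary setting):
+# max_objects_per_revert = 1000
+# would cap each revert type job at 1000 objects per cycle; any remaining
+# objects in that handoff partition wait for a later reconstructor pass.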
+#
+# You can set scheduling priority of processes. Niceness values range from -20
+# (most favorable to the process) to 19 (least favorable to the process).
+# nice_priority =
+#
+# You can set I/O scheduling class and priority of processes. I/O niceness
+# class values are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and
+# IOPRIO_CLASS_IDLE (idle). I/O niceness priority is a number which goes from
+# 0 to 7. The higher the value, the lower the I/O priority of the process.
+# Works only with ionice_class.
+# ionice_class =
+# ionice_priority =
+#
+# When upgrading from liberasurecode<=1.5.0, you may want to continue writing
+# legacy CRCs until all nodes are upgraded and capable of reading fragments
+# with zlib CRCs. liberasurecode>=1.6.2 checks for the environment variable
+# LIBERASURECODE_WRITE_LEGACY_CRC; if set (value doesn't matter), it will use
+# its legacy CRC. Set this option to true or false to ensure the environment
+# variable is or is not set. Leave the option blank or absent to not touch
+# the environment (default). For more information, see
+# https://bugs.launchpad.net/liberasurecode/+bug/1886088
+# write_legacy_ec_crc =
+#
+# When attempting to reconstruct a missing fragment on another node from a
+# fragment on the local node, the reconstructor may fail to fetch sufficient
+# fragments to reconstruct the missing fragment. This may be because most or
+# all of the remote fragments have been deleted, and the local fragment is
+# stale, in which case the reconstructor will never succeed in reconstructing
+# the apparently missing fragment and will log errors. If the object's
+# tombstones have been reclaimed then the stale fragment will never be deleted
+# (see https://bugs.launchpad.net/swift/+bug/1655608). If an operator suspects
+# that stale fragments have been re-introduced to the cluster and is seeing
+# error logs similar to those in the bug report, then the quarantine_threshold
+# option may be set to a value greater than zero. This enables the
+# reconstructor to quarantine the stale fragments when it fails to fetch more
+# than the quarantine_threshold number of fragments (including the stale
+# fragment) during an attempt to reconstruct. For example, setting the
+# quarantine_threshold to 1 would cause a fragment to be quarantined if no
+# other fragments can be fetched. The value may be reset to zero after the
+# reconstructor has run on all affected nodes and the error logs are no longer
+# seen.
+# Note: the quarantine_threshold applies equally to all policies, but for each
+# policy it is effectively capped at (ec_ndata - 1) so that a fragment is never
+# quarantined when sufficient fragments exist to reconstruct the object.
+# quarantine_threshold = 0
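+#
+# For example (hypothetical policy): with an EC policy configured with
+# ec_num_data_fragments = 4, a setting of
+# quarantine_threshold = 5
+# is effectively capped at 3 (ec_ndata - 1), so a fragment is never
+# quarantined while enough fragments remain to reconstruct the object.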
+#
+# Fragments are not quarantined until they are older than
+# quarantine_age, which defaults to the value of reclaim_age.
+# quarantine_age =
+#
+# Sets the maximum number of nodes to which requests will be made before
+# quarantining a fragment. You can use '* replicas' at the end to have it use
+# the number given times the number of replicas for the ring being used for the
+# requests. The minimum number of nodes to which requests are made is the
+# number of replicas for the policy minus 1 (the node on which the fragment is
+# to be rebuilt). The minimum is only exceeded if request_node_count is
+# greater, and only for the purposes of quarantining.
+# request_node_count = 2 * replicas
+
+[object-updater]
+# You can override the default log routing for this app here (don't use set!):
+# log_name = object-updater
+# log_facility = LOG_LOCAL0
+# log_level = INFO
+# log_address = /dev/log
+#
+# interval = 300.0
+# node_timeout = <whatever's in the DEFAULT section or 10>
+#
+# updater_workers controls how many processes the object updater will
+# spawn, while concurrency controls how many async_pending records
+# each updater process will operate on at any one time. With
+# concurrency=C and updater_workers=W, there will be up to W*C
+# async_pending records being processed at once.
+# concurrency = 8
+# updater_workers = 1
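+#
+# For example (hypothetical numbers):
+# concurrency = 8
+# updater_workers = 2
+# would allow up to 16 (W*C) async_pending records to be in flight at once.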
+#
+# Send at most this many object updates per second
+# objects_per_second = 50
+#
+# Send at most this many object updates per bucket per second. The value must
+# be a float greater than or equal to 0. Set to 0 for unlimited.
+# max_objects_per_container_per_second = 0
+#
+# The per_container ratelimit implementation uses a hashring to constrain
+# memory requirements.  Orders of magnitude more buckets will use (nominally)
+# more memory, but will ratelimit smaller groups of containers. The value must
+# be an integer greater than 0.
+# per_container_ratelimit_buckets = 1000
+#
+# Updates that cannot be sent due to per-container rate-limiting may be
+# deferred and re-tried at the end of the updater cycle. This option constrains
+# the size of the in-memory data structure used to store deferred updates.
+# Must be an integer value greater than or equal to 0.
+# max_deferred_updates = 10000
+#
+# Maximum number of oldest async pending timestamps to track for each
+# account-container pair.
+# async_tracker_max_entries = 100
+# Maximum number of oldest async pending timestamps to dump to recon cache.
+# async_tracker_dump_count = 5
+#
+# slowdown will sleep that amount between objects. Deprecated; use
+# objects_per_second instead.
 # slowdown = 0.01
+#
+# Log stats (at INFO level) every report_interval seconds. This
+# logging is per-process, so with concurrency > 1, the logs will
+# contain one stats log per worker process every report_interval
+# seconds.
+# report_interval = 300.0
+#
 # recon_cache_path = /var/cache/swift
+#
+# You can set scheduling priority of processes. Niceness values range from -20
+# (most favorable to the process) to 19 (least favorable to the process).
+# nice_priority =
+#
+# You can set I/O scheduling class and priority of processes. I/O niceness
+# class values are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and
+# IOPRIO_CLASS_IDLE (idle). I/O niceness priority is a number which goes from
+# 0 to 7. The higher the value, the lower the I/O priority of the process.
+# Works only with ionice_class.
+# ionice_class =
+# ionice_priority =
 
 [object-auditor]
 # You can override the default log routing for this app here (don't use set!):
@@ -114,8 +577,230 @@ use = egg:swift#recon
 # log_facility = LOG_LOCAL0
 # log_level = INFO
 # log_address = /dev/log
+#
+# Time in seconds to wait between auditor passes
+# interval = 30.0
+#
+# You can set the disk chunk size that the auditor uses, making it larger if
+# you like for more efficient local auditing of larger objects.
+# disk_chunk_size = 65536
 # files_per_second = 20
+# concurrency = 1
 # bytes_per_second = 10000000
 # log_time = 3600
 # zero_byte_files_per_second = 50
 # recon_cache_path = /var/cache/swift
+
+# Takes a comma separated list of ints. If set, the object auditor will
+# increment a counter for every object whose size is less than or equal to
+# the given break points and report the result after a full scan.
+# object_size_stats =
+#
+# You can set scheduling priority of processes. Niceness values range from -20
+# (most favorable to the process) to 19 (least favorable to the process).
+# nice_priority =
+#
+# You can set I/O scheduling class and priority of processes. I/O niceness
+# class values are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and
+# IOPRIO_CLASS_IDLE (idle). I/O niceness priority is a number which goes from
+# 0 to 7. The higher the value, the lower the I/O priority of the process.
+# Works only with ionice_class.
+# ionice_class =
+# ionice_priority =
+
+# The auditor will clean up old rsync tempfiles after they are "old
+# enough" to delete.  You can configure the time elapsed in seconds
+# before rsync tempfiles will be unlinked, or the default value of
+# "auto" will try to use object-replicator's rsync_timeout + 900 and fall
+# back to 86400 (1 day).
+# rsync_tempfile_timeout = auto
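+#
+# For example, if the [object-replicator] section sets rsync_timeout = 900,
+# then
+# rsync_tempfile_timeout = auto
+# resolves to 1800 seconds (900 + 900); if that value cannot be determined,
+# the auditor falls back to 86400 (1 day).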
+
+# A comma-separated list of watcher entry points. This lets operators
+# programmatically see audited objects.
+#
+# The entry point group name is "swift.object_audit_watcher". If your
+# setup.py has something like this:
+#
+# entry_points={'swift.object_audit_watcher': [
+#     'some_watcher = some_module:Watcher']}
+#
+# then you would enable it with "watchers = some_package#some_watcher".
+# For example, the built-in reference implementation is enabled as
+# "watchers = swift#dark_data".
+#
+# watchers =
+
+# Watcher-specific parameters can be added in a section with a name
+# [object-auditor:watcher:some_package#some_watcher]. The following
+# example uses the built-in reference watcher.
+#
+# [object-auditor:watcher:swift#dark_data]
+#
+# Action type can be 'log' (default), 'delete', or 'quarantine'.
+# action=log
+#
+# The watcher ignores objects younger than a certain minimum age.
+# This prevents spurious actions upon fresh objects while container
+# listings eventually settle.
+# grace_age=604800
+
+[object-expirer]
+# If this is true, this expirer will execute tasks from the legacy expirer task
+# queue; at least one object server should run with dequeue_from_legacy = true
+# dequeue_from_legacy = false
+#
+# Note: Be careful not to enable ``dequeue_from_legacy`` on too many expirers
+# as all legacy tasks are stored in a single hidden account and the same hidden
+# containers. On a large cluster one may inadvertently make the
+# account/container servers for these hidden resources too busy.
+#
+# Note: the processes and process options can only be used in conjunction with
+# nodes using `dequeue_from_legacy = true`.  These options are ignored on nodes
+# with `dequeue_from_legacy = false`.
+#
+# processes is how many parts to divide the legacy work into, one part per
+# process that will be doing the work
+# Setting processes to 0 means that a single legacy process will do all the work
+# processes can also be specified on the command line and will override the
+# config value
+# processes = 0
+#
+# process is which of the parts a particular legacy process will work on
+# process can also be specified on the command line and will override the config
+# value
+# process is "zero based", if you want to use 3 processes, you should run
+# processes with process set to 0, 1, and 2
+# process = 0
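+#
+# For example (hypothetical deployment): to split the legacy queue across
+# three expirer daemons, each daemon would set
+# processes = 3
+# and one of
+# process = 0
+# process = 1
+# process = 2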
+#
+# internal_client_conf_path = /etc/swift/internal-client.conf
+#
+# You can override the default log routing for this app here (don't use set!):
+# log_name = object-expirer
+# log_facility = LOG_LOCAL0
+# log_level = INFO
+# log_address = /dev/log
+#
+# interval = 300.0
+#
+# report_interval = 300.0
+#
+# request_tries is the number of times the expirer's internal client will
+# attempt any given request in the event of failure. The default is 3.
+# request_tries = 3
+#
+# concurrency is the level of concurrency to use to do the work; this value
+# must be set to at least 1
+# concurrency = 1
+#
+# deletes can be ratelimited to prevent the expirer from overwhelming the cluster
+# tasks_per_second = 50.0
+#
+# The expirer will re-attempt expiring if the source object is not available
+# up to reclaim_age seconds before it gives up and deletes the entry in the
+# queue.
+# reclaim_age = 604800
+
+# Number of task objects to cache before processing.  With many nodes it may
+# take some time to fill a larger cache_size but may also have a better chance
+# to distribute DELETEs to multiple target containers.
+# round_robin_task_cache_size = 100000
+
+# recon_cache_path = /var/cache/swift
+#
+# You can set scheduling priority of processes. Niceness values range from -20
+# (most favorable to the process) to 19 (least favorable to the process).
+# nice_priority =
+#
+# You can set I/O scheduling class and priority of processes. I/O niceness
+# class values are realtime, best-effort and idle. I/O niceness
+# priority is a number which goes from 0 to 7. The higher the value, the lower
+# the I/O priority of the process. Works only with ionice_class.
+# ionice_class =
+# ionice_priority =
+#
+# The expirer can delay the reaping of expired objects on disk (and in
+# container listings) with an account level or container level delay_reaping
+# time.
+# After the delay_reaping time has passed objects will be reaped as normal.
+# You may configure this delay_reaping value in seconds with dynamic config
+# option names prefixed with delay_reaping_<ACCT> for account level delays
+# and delay_reaping_<ACCT>/<CNTR> for container level delays.
+# Special characters in <ACCT> or <CNTR> should be quoted.
+# The delay_reaping value should be a float value greater than or equal to
+# zero.
+# A container level delay_reaping does not require an account level
+# delay_reaping but overrides the account level delay_reaping for the same
+# account if it exists.
+# For example:
+# delay_reaping_AUTH_test = 300.0
+# delay_reaping_AUTH_test2 = 86400.0
+# delay_reaping_AUTH_test/test = 400.0
+# delay_reaping_AUTH_test/test2 = 600.0
+# delay_reaping_AUTH_test/special%0Achars%3Dshould%20be%20quoted
+# N.B. By default no delay_reaping value is configured for any accounts or
+# containers.
+
+# Note: Put it at the beginning of the pipeline to profile all middleware. But
+# it is safer to put this after healthcheck. Not intended for production
+# environments!
+[filter:xprofile]
+use = egg:swift#xprofile
+# This option enables you to switch profilers; the profiler should inherit from
+# the python standard profiler. Currently the supported values include
+# 'cProfile', 'eventlet.green.profile', etc.
+# profile_module = eventlet.green.profile
+#
+# This prefix will be used to combine process ID and timestamp to name the
+# profile data file.  Make sure the executing user has permission to write
+# into this path (missing path segments will be created, if necessary).
+# If you enable profiling in more than one type of daemon, you must override
+# it with a unique value like: /var/log/swift/profile/object.profile
+# log_filename_prefix = /tmp/log/swift/profile/default.profile
+#
+# The profile data will be dumped to local disk based on the above naming rule
+# at this interval.
+# dump_interval = 5.0
+#
+# Be careful: this option will make the profiler dump data into timestamped
+# files, which means lots of files will pile up in the directory.
+# dump_timestamp = false
+#
+# This is the path of the URL to access the mini web UI.
+# path = /__profile__
+#
+# Clear the data when the wsgi server shuts down.
+# flush_at_shutdown = false
+#
+# unwind the iterator of applications
+# unwind = false
+
+[object-relinker]
+# You can override the default log routing for this app here (don't use set!):
+# log_name = object-relinker
+# log_facility = LOG_LOCAL0
+# log_level = INFO
+# log_address = /dev/log
+#
+# Start up to this many sub-processes to process disks in parallel. Each disk
+# will be handled by at most one child process. By default, one process is
+# spawned per disk.
+# workers = auto
+#
+# Target this many relinks/cleanups per second for each worker, to reduce the
+# likelihood that the added I/O from a partition-power increase impacts
+# client traffic. Use zero for unlimited.
+# files_per_second = 0.0
+#
+# stats_interval = 300.0
+# recon_cache_path = /var/cache/swift
+#
+# Highly concurrent PUTs can result in timestamp collisions; see
+# https://bugs.launchpad.net/swift/+bug/1971686 and
+# https://bugs.launchpad.net/swift/+bug/2127779 for more information.
+# This can lead to relinker errors which may be benign; use this option to
+# handle such errors.  With this option enabled, during the relink phase
+# we'll quarantine the colliding file in the new target part dir and retry
+# the relink.  During the cleanup phase we ignore the un-matched inode
+# "collision" and allow the cleanup of the old file in the old part dir,
+# the same as for tombstones.
+# clobber_hardlink_collisions = false
diff --git a/etc/proxy-server.conf-sample b/etc/proxy-server.conf-sample
index 7a9254de37..5caa0d630b 100644
--- a/etc/proxy-server.conf-sample
+++ b/etc/proxy-server.conf-sample
@@ -1,39 +1,168 @@
 [DEFAULT]
 # bind_ip = 0.0.0.0
-# bind_port = 80
+bind_port = 8080
+# Connection idle timeout (in seconds)
+# keep_idle = 600
+# Socket bind timeout (in seconds)
 # bind_timeout = 30
 # backlog = 4096
 # swift_dir = /etc/swift
-# workers = 1
 # user = swift
+
+# Enables exposing configuration settings via HTTP GET /info.
+# expose_info = true
+
+# Key to use for admin calls that are HMAC signed.  Default is empty,
+# which will disable admin calls to /info.
+# admin_key = secret_admin_key
+#
+# Allows withholding sections from showing up in the public calls
+# to /info.  You can withhold subsections by separating the dict level with a
+# ".". Default value is 'swift.valid_api_versions, swift.auto_create_account_prefix'
+# which allows all registered features to be listed via HTTP GET /info except
+# swift.valid_api_versions and swift.auto_create_account_prefix information.
+# As an example, the following would cause the sections 'container_quotas' and
+# 'tempurl' to not be listed, and the key max_failed_deletes would be removed from
+# bulk_delete.
+# disallowed_sections = swift.valid_api_versions, container_quotas, tempurl, bulk_delete.max_failed_deletes
+
+# Use an integer to override the number of pre-forked processes that will
+# accept connections.  Should default to the number of effective cpu
+# cores in the system.  It's worth noting that individual workers will
+# use many eventlet co-routines to service multiple concurrent requests.
+# workers = auto
+#
+# Maximum concurrent requests per worker
+# max_clients = 1024
+#
 # Set the following two lines to enable SSL. This is for testing only.
 # cert_file = /etc/swift/proxy.crt
 # key_file = /etc/swift/proxy.key
-# expiring_objects_container_divisor = 86400
+#
+#
 # You can specify default log routing here if you want:
 # log_name = swift
 # log_facility = LOG_LOCAL0
 # log_level = INFO
-# log_headers = False
+# log_headers = false
 # log_address = /dev/log
+# The following caps the length of log lines to the value given; no limit if
+# set to 0, the default.
+# log_max_line_length = 0
+#
+# This optional suffix (default is empty) is appended to the swift transaction
+# id and allows one to easily figure out which cluster an X-Trans-Id belongs to.
+# This is very useful when one is managing more than one swift cluster.
+# trans_id_suffix =
+#
 # comma separated list of functions to call to setup custom log handlers.
 # functions get passed: conf, name, log_to_console, log_route, fmt, logger,
 # adapted_logger
 # log_custom_handlers =
+#
 # If set, log_udp_host will override log_address
 # log_udp_host =
 # log_udp_port = 514
+#
 # You can enable StatsD logging here:
-# log_statsd_host = localhost
+# log_statsd_host =
 # log_statsd_port = 8125
-# log_statsd_default_sample_rate = 1
+# log_statsd_default_sample_rate = 1.0
+# log_statsd_sample_rate_factor = 1.0
 # log_statsd_metric_prefix =
-# Use a comma separated list of full url (http://foo.bar:1234,https://foo.bar)
+#
+# Statsd metrics may include labeling information in a variety of formats.
+# Available options:
+#     disabled, dogstatsd, graphite, influxdb, librato.
+# Defaults to disabled; enable labeled metrics by setting this option to one
+# of the other values.
+# See also: https://github.com/prometheus/statsd_exporter#tagging-extensions.
+# Note that enabling statsd_label_mode will likely increase the number of time
+# series stored, as more labeled metrics may be exposed than may have been
+# previously extracted from the dotted non-labeled legacy metric format.
+# statsd_label_mode = disabled
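+#
+# For example (one hypothetical choice):
+# statsd_label_mode = dogstatsd
+# would emit labels using the dogstatsd tagging extension described in the
+# statsd_exporter link above.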
+#
+# Historically, statsd metrics were emitted with implied labels as part of
+# metric name in a dotted "legacy" format. Once swift is fully instrumented
+# with labeled metrics, and you have statsd_label_mode enabled, you may want to
+# turn off legacy metrics; to do that set this option to False. Defaults to
+# True.
+# statsd_emit_legacy = True
+#
+# Statsd metrics emitted with labels also support user defined labels
+# configured by options. The format for each option is:
+#     statsd_user_label_<name> = <value>
+# where <name> and <value> are restricted to a subset of non-whitespace ASCII
+# characters, including letters (upper and lower), numbers and underscores.
+# <value> may also contain the period character (.). Each option will add a
+# label with name user_<name> and value <value> to labeled metrics.
+# User defined labels may be configured in this [DEFAULT] section, in which
+# case they will be included with every labeled metric, or they may be
+# configured in individual [filter:<filter_name>] sections, in which case they
+# will only be included with labeled metrics emitted by that filter.
+# For example, a proxy-server configuration could use the following to
+# delineate labeled metrics emitted by different instances of proxy-logging
+# middleware in the pipeline:
+#     [filter:subrequest-logging]
+#     use = egg:swift#proxy_logging
+#     statsd_user_label_reqctx = subrequest
+# which adds a label with name 'user_reqctx' and value 'subrequest' to every
+# labeled metrics emitted by this proxy-logging instance. This would achieve
+# similar effect as the following proxy-server configuration for legacy
+# non-labeled metrics:
+#     [filter:subrequest-logging]
+#     use = egg:swift#proxy_logging
+#     access_log_statsd_metric_prefix = subrequest
+# Note that the legacy metrics option 'access_log_statsd_metric_prefix' does
+# not apply to labeled metrics.
+# By default there are no user defined labels.
+#
+# List of origin hosts that are allowed for CORS requests in addition to what
+# the container has set.
+# Use a comma separated list of full URL (http://foo.bar:1234,https://foo.bar)
 # cors_allow_origin =
+
+# If True (default) then CORS requests are only allowed if their Origin header
+# matches an allowed origin. Otherwise, any Origin is allowed.
+# strict_cors_mode = True
+#
+# Comma separated list of headers to expose through Access-Control-Expose-Headers,
+# in addition to the defaults and any headers set in container metadata (see
+# CORS documentation).
+# cors_expose_headers =
+#
+# General timeout when sending to or receiving from clients.
+# client_timeout = 60.0
+#
+# Timeout to use when looking for pipelined requests. Set to zero to disable
+# request pipelining. Defaults to client_timeout. Requires eventlet>=0.33.4;
+# with earlier eventlet, any non-zero value is treated as client_timeout.
+# keepalive_timeout =
+#
+# Note: enabling eventlet_debug might reveal sensitive information, for example
+# signatures for temp urls
 # eventlet_debug = false
+#
+# You can set scheduling priority of processes. Niceness values range from -20
+# (most favorable to the process) to 19 (least favorable to the process).
+# nice_priority =
+#
+# You can set I/O scheduling class and priority of processes. I/O niceness
+# class values are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and
+# IOPRIO_CLASS_IDLE (idle). I/O niceness priority is a number which goes from
+# 0 to 7. The higher the value, the lower the I/O priority of the process.
+# Works only with ionice_class.
+# ionice_class =
+# ionice_priority =
 
 [pipeline:main]
-pipeline = catch_errors healthcheck cache ratelimit tempauth proxy-logging proxy-server
+# This sample pipeline uses tempauth and is used for SAIO dev work and
+# testing. See below for a pipeline using keystone.
+pipeline = catch_errors gatekeeper healthcheck proxy-logging cache listing_formats container_sync bulk tempurl ratelimit tempauth copy container-quotas account-quotas slo dlo versioned_writes symlink proxy-logging proxy-server
+
+# The following pipeline shows keystone integration. Comment out the one
+# above and uncomment this one. Additional steps for integrating keystone are
+# covered further below in the filter sections for authtoken and keystoneauth.
+#pipeline = catch_errors gatekeeper healthcheck proxy-logging cache container_sync bulk tempurl ratelimit authtoken keystoneauth copy container-quotas account-quotas slo dlo versioned_writes symlink proxy-logging proxy-server
 
 [app:proxy-server]
 use = egg:swift#proxy
@@ -42,50 +171,271 @@ use = egg:swift#proxy
 # set log_facility = LOG_LOCAL0
 # set log_level = INFO
 # set log_address = /dev/log
-# log_handoffs = True
+#
+# When deployed behind a proxy, load balancer, or SSL terminator that is
+# configured to speak the human-readable (v1) PROXY protocol (see
+# http://www.haproxy.org/download/1.7/doc/proxy-protocol.txt), you should set
+# this option to true.  The proxy-server will populate the client connection
+# information using the PROXY protocol and reject any connection missing a
+# valid PROXY line with a 400.  Only v1 (human-readable) of the PROXY protocol
+# is supported.
+# require_proxy_protocol = false
+#
+# log_handoffs = true
+# How long (in seconds) to cache account existence information. Account
+# non-existence will be cached one-tenth as long.
 # recheck_account_existence = 60
+# How long (in seconds) to cache container existence information. Container
+# non-existence will be cached one-tenth as long.
 # recheck_container_existence = 60
-# object_chunk_size = 8192
-# client_chunk_size = 8192
+#
+# How long (in seconds) the proxy should cache a set of shard ranges for
+# a container when the set is to be used for directing object updates.
+# Note that stale shard range info should be fine; updates will still
+# eventually make their way to the correct shard. As a result, you can
+# usually set this much higher than the existence checks above.
+# recheck_updating_shard_ranges = 3600
+#
+# How long the proxy should cache a set of shard ranges for a container when
+# the set is to be used for gathering object listings.
+# Note that stale shard range info might result in incomplete object listings
+# so this value should be set less than recheck_updating_shard_ranges.
+# recheck_listing_shard_ranges = 600
+#
+# For particularly active containers, having information age out of cache can
+# be quite painful: suddenly thousands of requests per second all miss and
+# have to go to disk. By (rarely) going direct to disk regardless of whether
+# data is present in memcache, we can periodically refresh the data in memcache
+# without causing a thundering herd. Values around 0.0 - 0.1 (i.e., one in
+# every thousand requests skips cache, or fewer) are recommended.
+# container_existence_skip_cache_pct = 0.0
+# container_updating_shard_ranges_skip_cache_pct = 0.0
+# container_listing_shard_ranges_skip_cache_pct = 0.0
+# account_existence_skip_cache_pct = 0.0
+#
+# Use a cooperative token on the updating-namespace cache to coalesce the
+# requests which fetch updating namespaces from the backend and set them in
+# memcached.
+# Number of cooperative tokens per token session; 0 means to disable the
+# usage of cooperative tokens and talk directly to the backend and memcache.
+# namespace_cache_tokens_per_session = 3
+#
+# The average time spent (in seconds) getting updating namespaces from the
+# container servers. This is used as the basic unit for the cooperative token
+# to figure out retry intervals when a request didn't acquire a token and is
+# waiting for other requests to fill in the cache; a cooperative token
+# session (`token_ttl`) will be 10 times this value.
+# namespace_avg_backend_fetch_time = 0.3
+#
+# object_chunk_size = 65536
+# client_chunk_size = 65536
+#
+# How long (in seconds) the proxy server will wait on responses from the a/c/o
+# servers.
 # node_timeout = 10
-# client_timeout = 60
+#
+# How long (in seconds) the proxy server will wait for an initial response and
+# to read a chunk of data from the object servers while serving GET / HEAD
+# requests.  Timeouts from these requests can be recovered from so setting this
+# to something lower than node_timeout would provide quicker error recovery
+# while allowing for a longer timeout for non-recoverable requests (PUTs).
+# Does not apply to requests with a truthy X-Newest header value.
+# Defaults to node_timeout, should be overridden if node_timeout is set to a
+# high number to prevent client timeouts from firing before the proxy server
+# has a chance to retry.
+# recoverable_node_timeout = node_timeout
+#
+# Connection timeout (in seconds)
 # conn_timeout = 0.5
-# How long without an error before a node's error count is reset. This will
-# also be how long before a node is reenabled after suppression is triggered.
-# error_suppression_interval = 60
+#
+# How long (in seconds) to wait for requests to finish after a quorum has been
+# established.
+# post_quorum_timeout = 0.5
+#
+# How long (in seconds) without an error before a node's error count is reset.
+# This will also be how long before a node is reenabled after suppression is
+# triggered.
+# Set to 0 to disable error-limiting.
+# error_suppression_interval = 60.0
+#
 # How many errors can accumulate before a node is temporarily ignored.
 # error_suppression_limit = 10
+#
 # If set to 'true' any authorized user may create and delete accounts; if
 # 'false' no one, even authorized, can.
 # allow_account_management = false
-# Set object_post_as_copy = false to turn on fast posts where only the metadata
-# changes are stored anew and the original data file is kept in place. This
-# makes for quicker posts; but since the container metadata isn't updated in
-# this mode, features like container sync won't be able to sync posts.
-# object_post_as_copy = true
+#
 # If set to 'true' authorized accounts that do not yet exist within the Swift
 # cluster will be automatically created.
 # account_autocreate = false
+#
 # If set to a positive value, trying to create a container when the account
 # already has at least this maximum containers will result in a 403 Forbidden.
 # Note: This is a soft limit, meaning a user might exceed the cap for
 # recheck_account_existence before the 403s kick in.
 # max_containers_per_account = 0
+#
 # This is a comma separated list of account hashes that ignore the
 # max_containers_per_account cap.
 # max_containers_whitelist =
+#
 # Comma separated list of Host headers to which the proxy will deny requests.
 # deny_host_headers =
-# Prefix used when automatically creating accounts.
-# auto_create_account_prefix = .
-# Depth of the proxy put queue.
-# put_queue_depth = 10
-# Start rate-limiting object segment serving after the Nth segment of a
-# segmented object.
-# rate_limit_after_segment = 10
-# Once segment rate-limiting kicks in for an object, limit segments served
-# to N per second.
-# rate_limit_segments_per_sec = 1
+#
+# During GET and HEAD requests, storage nodes can be chosen at random
+# (shuffle), by using timing measurements (timing), or by using an explicit
+# region/zone match (affinity). Using timing measurements may allow for lower
+# overall latency, while using affinity allows for finer control. In both the
+# timing and affinity cases, equally-sorting nodes are still randomly chosen to
+# spread load.
+# The valid values for sorting_method are "affinity", "shuffle", or "timing".
+# This option may be overridden in a per-policy configuration section.
+# sorting_method = shuffle
+#
+# If the "timing" sorting_method is used, the timings will only be valid for
+# the number of seconds configured by timing_expiry.
+# timing_expiry = 300
+#
+# Normally, you should only be moving one replica's worth of data at a time
+# when rebalancing. If you're rebalancing more aggressively, increase this
+# to avoid erroneously returning a 404 when the primary assignments that
+# *didn't* change get overloaded.
+# rebalance_missing_suppression_count = 1
+#
+# By default on a GET/HEAD swift will connect to a minimum number of storage
+# nodes in a minimum number of threads - for replicated data just a single
+# request to a single node at a time.  When enabled, concurrent_gets allows the
+# proxy to use up to replica count threads when waiting on a response.  In
+# conjunction with the concurrency_timeout option this will allow swift to send
+# out GET/HEAD requests to the storage nodes concurrently and answer as soon as
+# the minimum number of backend responses are available - in replicated
+# contexts this will be the first backend replica to respond.
+# concurrent_gets = off
+#
+# This parameter controls how long (in seconds) to wait before firing off the
+# next concurrent_get thread. A value of 0 would be fully concurrent; any other
+# number will stagger the firing of the threads. This number should be between
+# 0 and node_timeout. The default is whatever you set for the conn_timeout
+# parameter.
+# concurrency_timeout = 0.5
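+#
+# For example (hypothetical settings):
+# concurrent_gets = on
+# concurrency_timeout = 0.0
+# would fire GET/HEAD requests at up to replica-count nodes simultaneously
+# ("fully concurrent") and, for replicated data, answer with the first
+# backend replica to respond.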
+#
+# By default on an EC GET request swift will connect to a minimum number of
+# storage nodes in a minimum number of threads - for erasure coded data, ndata
+# requests to primary nodes are started at the same time.  When greater than
+# zero this option provides additional robustness and may reduce first byte
+# latency by starting additional requests - up to as many as nparity.
+# concurrent_ec_extra_requests = 0
+#
+# Set to the number of nodes to contact for a normal request. You can use
+# '* replicas' at the end to have it use the number given times the number of
+# replicas for the ring being used for the request.
+# request_node_count = 2 * replicas
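+#
+# For example, with a 3-replica ring the default of
+# request_node_count = 2 * replicas
+# allows up to 6 nodes (primaries plus handoffs) to be contacted for a normal
+# request.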
+#
+# Specifies which backend servers to prefer on reads. Format is a comma
+# separated list of affinity descriptors of the form <selection>=<priority>.
+# The <selection> may be r<N> for selecting nodes in region N or r<N>z<M> for
+# selecting nodes in region N, zone M. The <priority> value should be a whole
+# number that represents the priority to be given to the selection; lower
+# numbers are higher priority.
+#
+# Example: first read from region 1 zone 1, then region 1 zone 2, then
+# anything in region 2, then everything else:
+# read_affinity = r1z1=100, r1z2=200, r2=300
+# Default is empty, meaning no preference.
+# This option may be overridden in a per-policy configuration section.
+# read_affinity =
+#
+# Specifies which backend servers to prefer on object writes. Format is a comma
+# separated list of affinity descriptors of the form r<N> for region N or
+# r<N>z<M> for region N, zone M. If this is set, then when handling an object
+# PUT request, some number (see setting write_affinity_node_count) of local
+# backend servers will be tried before any nonlocal ones.
+#
+# Example: try to write to regions 1 and 2 before writing to any other
+# nodes:
+# write_affinity = r1, r2
+# Default is empty, meaning no preference.
+# This option may be overridden in a per-policy configuration section.
+# write_affinity =
+#
+# The number of local (as governed by the write_affinity setting) nodes to
+# attempt to contact first on writes, before any non-local ones. The value
+# should be an integer number, or use '* replicas' at the end to have it use
+# the number given times the number of replicas for the ring being used for the
+# request.
+# This option may be overridden in a per-policy configuration section.
+# write_affinity_node_count = 2 * replicas
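+#
+# For example (hypothetical): with write_affinity = r1 and a 3-replica ring,
+# write_affinity_node_count = 2 * replicas
+# means up to 6 nodes in region 1 are tried before any non-local nodes.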
+#
+# The number of local (as governed by the write_affinity setting) handoff nodes
+# to attempt to contact on deletion, in addition to primary nodes.
+#
+# Example: in a geographically distributed deployment of 2 regions with
+# replicas=3, there may sometimes be 1 primary node and 2 local handoff nodes
+# in one region holding an object after upload but before the object has been
+# replicated to the appropriate locations in other regions. In this case,
+# sending the delete request to these handoff nodes as well helps make the
+# correct decision for the response. The default value 'auto' means Swift will
+# calculate the number automatically; in that case the value is
+# (replicas - len(local_primary_nodes)). This option may be overridden in a
+# per-policy configuration section.
+# write_affinity_handoff_delete_count = auto
+#
+# These are the headers whose values will only be shown to swift_owners. The
+# exact definition of a swift_owner is up to the auth system in use, but
+# usually indicates administrative responsibilities.
+# swift_owner_headers = x-container-read, x-container-write, x-container-sync-key, x-container-sync-to, x-account-meta-temp-url-key, x-account-meta-temp-url-key-2, x-container-meta-temp-url-key, x-container-meta-temp-url-key-2, x-account-access-control
+#
+# You can set scheduling priority of processes. Niceness values range from -20
+# (most favorable to the process) to 19 (least favorable to the process).
+# nice_priority =
+#
+# You can set I/O scheduling class and priority of processes. I/O niceness
+# class values are IOPRIO_CLASS_RT (realtime), IOPRIO_CLASS_BE (best-effort) and
+# IOPRIO_CLASS_IDLE (idle). I/O niceness priority is a number which goes from
+# 0 to 7. The higher the value, the lower the I/O priority of the process.
+# Works only with ionice_class.
+# ionice_class =
+# ionice_priority =
+#
+# When reloading servers with SIGUSR1, workers running with old config/code
+# are allowed some time to finish serving in-flight requests. Use this to
+# configure the grace period (in seconds), after which the reloaded server
+# will issue SIGKILLs to remaining stale workers.
+# stale_worker_timeout = 86400
+#
+# When upgrading from liberasurecode<=1.5.0, you may want to continue writing
+# legacy CRCs until all nodes are upgraded and capable of reading fragments
+# with zlib CRCs. liberasurecode>=1.6.2 checks for the environment variable
+# LIBERASURECODE_WRITE_LEGACY_CRC; if set (value doesn't matter), it will use
+# its legacy CRC. Set this option to true or false to ensure the environment
+# variable is or is not set. Leave the option blank or absent to not touch
+# the environment (default). For more information, see
+# https://bugs.launchpad.net/liberasurecode/+bug/1886088
+# write_legacy_ec_crc =
+#
+# Setting 'allow_open_expired' to 'true' allows the 'x-open-expired' header
+# to be used with HEAD, GET, or POST requests to access expired objects that
+# have not yet been deleted from disk. This can be useful in conjunction with
+# the object-expirer 'delay_reaping' feature.
+# This flag is set to false by default, so it must be changed to access
+# expired objects.
+# allow_open_expired = false
+
+# Some proxy-server configuration options may be overridden on a per-policy
+# basis by including per-policy config section(s). The value of any option
+# specified in a per-policy section will override any value given in the
+# proxy-server section for that policy only. Otherwise the value of these
+# options will be that specified in the proxy-server section.
+# The section name should refer to the policy index, not the policy name.
+# [proxy-server:policy:<N>]
+# sorting_method =
+# read_affinity =
+# write_affinity =
+# write_affinity_node_count =
+# write_affinity_handoff_delete_count =
+# rebalance_missing_suppression_count = 1
+# concurrent_gets = off
+# concurrency_timeout = 0.5
+# concurrent_ec_extra_requests = 0
 
 [filter:tempauth]
 use = egg:swift#tempauth
@@ -93,29 +443,59 @@ use = egg:swift#tempauth
 # set log_name = tempauth
 # set log_facility = LOG_LOCAL0
 # set log_level = INFO
-# set log_headers = False
+# set log_headers = false
 # set log_address = /dev/log
+#
 # The reseller prefix will verify a token begins with this prefix before even
 # attempting to validate it. Also, with authorization, only Swift storage
 # accounts with this prefix will be authorized by this middleware. Useful if
 # multiple auth systems are in use for one Swift cluster.
+# The reseller_prefix may contain a comma separated list of items. The first
+# item is used for the token as mentioned above. If second and subsequent
+# items exist, the middleware will handle authorization for an account with
+# that prefix. For example, for prefixes "AUTH, SERVICE", a path of
+# /v1/SERVICE_account is handled the same as /v1/AUTH_account. If an empty
+# (blank) reseller prefix is required, it must be first in the list. Two
+# single quote characters indicate an empty (blank) reseller prefix.
 # reseller_prefix = AUTH
+
+#
+# The require_group parameter names a group that must be presented by
+# either X-Auth-Token or X-Service-Token. Usually this parameter is
+# used only with multiple reseller prefixes (e.g., SERVICE_require_group=blah).
+# By default, no group is needed. Do not use .admin.
+# require_group =
+
 # The auth prefix will cause requests beginning with this prefix to be routed
 # to the auth subsystem, for granting tokens, etc.
 # auth_prefix = /auth/
+# Token lifetime (in seconds)
 # token_life = 86400
-# This is a comma separated list of hosts allowed to send X-Container-Sync-Key
-# requests.
-# allowed_sync_hosts = 127.0.0.1
+#
 # This allows middleware higher in the WSGI pipeline to override auth
 # processing, useful for middleware such as tempurl and formpost. If you know
 # you're not going to use such middleware and you want a bit of extra security,
 # you can set this to false.
 # allow_overrides = true
-# This specifies what scheme to return with storage urls:
+#
+# This specifies what scheme to return with storage URLs:
 # http, https, or default (chooses based on what the server is running as)
 # This can be useful with an SSL load balancer in front of a non-SSL server.
 # storage_url_scheme = default
+#
+# Fernet keys may be used for storage, rather than relying on memcached.
+# Multiple keys may be configured using options named 'fernet_key_<key_id>'
+# where 'key_id' is a unique identifier. The value should be 32 url-safe
+# base64-encoded bytes, such as may be generated using
+# `openssl rand -base64 32 | tr '+/' '-_'`
+# Any of these keys may be used for decryption. Only one key may be used
+# for encryption by a proxy at any given time; configure it with the
+# 'active_fernet_key_id' option. All proxies in the cluster should know
+# about a key before it is activated. If blank (the default),
+# memcached-backed tokens will be issued.
+# fernet_key_myid = <32 url-safe base64-encoded bytes>
+# active_fernet_key_id = myid
+#
 # Lastly, you need to list all the accounts/users you want here. The format is:
+#   user_<account>_<user> = <key> [group] [group] [...] [storage_url]
+# or if you want underscores in <account> or <user>, you can base64 encode them
@@ -123,8 +503,9 @@ use = egg:swift#tempauth
 #   user64_<account_b64>_<user_b64> = <key> [group] [group] [...] [storage_url]
 # There are special groups of:
 #   .reseller_admin = can do anything to any account for this auth
+#   .reseller_reader = can GET/HEAD anything in any account for this auth
 #   .admin = can do anything within the account
-# If neither of these groups are specified, the user can only access containers
+# If none of these groups are specified, the user can only access containers
 # that have been explicitly allowed for them by a .admin or .reseller_admin.
 # The trailing optional storage_url allows you to specify an alternate url to
 # hand back to the user upon authentication. If not specified, this defaults to
@@ -132,35 +513,303 @@ use = egg:swift#tempauth
 # to what the requester would need to use to reach this host.
 # Here are example entries, required for running the tests:
 user_admin_admin = admin .admin .reseller_admin
+user_admin_auditor = admin_ro .reseller_reader
 user_test_tester = testing .admin
-user_test2_tester2 = testing2 .admin
+user_test_tester2 = testing2 .admin
 user_test_tester3 = testing3
+user_test2_tester2 = testing2 .admin
+user_test5_tester5 = testing5 service
 
 # To enable Keystone authentication you need to have the auth token
 # middleware first to be configured. Here is an example below, please
 # refer to the keystone's documentation for details about the
 # different settings.
 #
-# You'll need to have as well the keystoneauth middleware enabled
-# and have it in your main pipeline so instead of having tempauth in
-# there you can change it to: authtoken keystone
+# You'll also need to have the keystoneauth middleware enabled and have it in
+# your main pipeline, as shown in the sample pipeline at the top of this file.
+#
+# The following parameters are known to work with keystonemiddleware v2.3.0
+# (above v2.0.0), but checking the latest information in the documentation
+# page [1] is recommended.
+# 1. https://docs.openstack.org/keystonemiddleware/latest/middlewarearchitecture.html#configuration
 #
 # [filter:authtoken]
-# paste.filter_factory = keystoneclient.middleware.auth_token:filter_factory
-# auth_host = keystonehost
-# auth_port = 35357
-# auth_protocol = http
-# auth_uri = http://keystonehost:5000/
-# admin_tenant_name = service
-# admin_user = swift
-# admin_password = password
-# delay_auth_decision = 1
+# paste.filter_factory = keystonemiddleware.auth_token:filter_factory
+# www_authenticate_uri = http://keystonehost:5000
+# auth_url = http://keystonehost:5000
+# auth_plugin = password
+# The following credentials must match the Keystone credentials for the Swift
+# service and may need to be changed to match your Keystone configuration. The
+# example values shown here assume a user named 'swift' with admin role on a
+# project named 'service', both being in the Keystone domain with id 'default'.
+# Refer to the keystonemiddleware documentation link above [1] for other
+# examples.
+# project_domain_id = default
+# user_domain_id = default
+# project_name = service
+# username = swift
+# password = password
+#
+# delay_auth_decision defaults to False, but leaving it as false will
+# prevent other auth systems, staticweb, tempurl, formpost, and ACLs from
+# working. This value must be explicitly set to True.
+# delay_auth_decision = False
+#
+# cache = swift.cache
+# include_service_catalog = False
 #
 # [filter:keystoneauth]
 # use = egg:swift#keystoneauth
-# Operator roles is the role which user would be allowed to manage a
-# tenant and be able to create container or give ACL to others.
+# The reseller_prefix option lists account namespaces that this middleware is
+# responsible for. The prefix is placed before the Keystone project id.
+# For example, for project 12345678, and prefix AUTH, the account is
+# named AUTH_12345678 (i.e., path is /v1/AUTH_12345678/...).
+# Several prefixes are allowed by specifying a comma-separated list
+# as in: "reseller_prefix = AUTH, SERVICE". The empty string indicates a
+# single blank/empty prefix. If an empty prefix is required in a list of
+# prefixes, a value of '' (two single quote characters) indicates a
+# blank/empty prefix. Except for the blank/empty prefix, an underscore ('_')
+# character is appended to the value unless already present.
+# reseller_prefix = AUTH
+#
+# The user must have at least one role named by operator_roles on a
+# project in order to create, delete and modify containers and objects
+# and to set and read privileged headers such as ACLs.
+# If there are several reseller prefix items, you can prefix the
+# parameter so it applies only to those accounts (for example
+# the parameter SERVICE_operator_roles applies to the /v1/SERVICE_
+# path). If you omit the prefix, the option applies to all reseller
+# prefix items. For the blank/empty prefix, prefix with '' (do not put
+# underscore after the two single quote characters).
 # operator_roles = admin, swiftoperator
+#
+# The reseller admin role has the ability to create and delete accounts
+# reseller_admin_role = ResellerAdmin
+#
+# This allows middleware higher in the WSGI pipeline to override auth
+# processing, useful for middleware such as tempurl and formpost. If you know
+# you're not going to use such middleware and you want a bit of extra security,
+# you can set this to false.
+# allow_overrides = true
+#
+# If the service_roles parameter is present, an X-Service-Token must be
+# present in the request that when validated, grants at least one role listed
+# in the parameter. The X-Service-Token may be scoped to any project.
+# If there are several reseller prefix items, you can prefix the
+# parameter so it applies only to those accounts (for example
+# the parameter SERVICE_service_roles applies to the /v1/SERVICE_
+# path). If you omit the prefix, the option applies to all reseller
+# prefix items. For the blank/empty prefix, prefix with '' (do not put
+# underscore after the two single quote characters).
+# By default, no service_roles are required.
+# service_roles =
+#
+# For backwards compatibility, keystoneauth will match names in cross-tenant
+# access control lists (ACLs) when both the requesting user and the tenant
+# are in the default domain, i.e. the domain to which existing tenants are
+# migrated. The default_domain_id value configured here should be the same as
+# the value used during migration of tenants to keystone domains.
+# default_domain_id = default
+#
+# For a new installation, or an installation in which keystone projects may
+# move between domains, you should disable backwards compatible name matching
+# in ACLs by setting allow_names_in_acls to false:
+# allow_names_in_acls = true
+#
+# In OpenStack terms, these reader roles are scoped for system: they
+# can read anything across projects and domains.
+# They are used for auditing and compliance functions.
+# In Swift terms, these roles are as powerful as the reseller_admin_role,
+# only do not modify the cluster.
+# By default the list of reader roles is empty.
+# system_reader_roles =
+#
+# This is a reader role scoped for a Keystone project.
+# An identity that has this role can read anything in a project, so it is
+# basically a swiftoperator, but read-only.
+# project_reader_roles =
+
+[filter:s3api]
+use = egg:swift#s3api
+
+# s3api setup:
+#
+# With either tempauth or your custom auth:
+# - Put s3api just before your auth filter(s) in the pipeline
+# With keystone:
+# - Put s3api and s3token before keystoneauth in the pipeline, but after
+#   auth_token
+# If you have ratelimit enabled for Swift requests, you may want to place a
+# second copy after auth to also ratelimit S3 requests.
+#
+# Swift has no concept of the S3's resource owner; the resources
+# (i.e. containers and objects) created via the Swift API have no owner
+# information. This option specifies how the s3api middleware handles them
+# with the S3 API.  If this option is 'false', such kinds of resources will be
+# invisible and no users can access them with the S3 API.  If set to 'true',
+# a resource without an owner belongs to everyone and everyone can access it
+# with the S3 API.  If you care about S3 compatibility, set 'false' here.  This
+# option makes sense only when the s3_acl option is set to 'true' and your
+# Swift cluster has the resources created via the Swift API.
+# allow_no_owner = false
+#
+# Set a region name of your Swift cluster.  Note that the s3api doesn't choose
+# a region of the newly created bucket.  This value is used for the
+# GET Bucket location API and v4 signatures calculation.
+# location = us-east-1
+#
+# Set whether to enforce DNS-compliant bucket names. Note that S3 enforces
+# these conventions in all regions except the US Standard region.
+# dns_compliant_bucket_names = True
+#
+# Set the default maximum number of objects returned in the GET Bucket
+# response.
+# max_bucket_listing = 1000
+#
+# Set the maximum number of parts returned in the List Parts operation.
+# (default: 1000, the same as the S3 specification)
+# If setting it larger than 10000 (swift's container_listing_limit default),
+# make sure you also increase the container_listing_limit in swift.conf.
+# max_parts_listing = 1000
+#
+# Set the maximum number of objects we can delete with the Multi-Object Delete
+# operation.
+# max_multi_delete_objects = 1000
+#
+# Set the number of objects to delete at a time with the Multi-Object Delete
+# operation.
+# multi_delete_concurrency = 2
+#
+# If set to 'true', s3api uses its own metadata for ACLs
+# (e.g. X-Container-Sysmeta-S3Api-Acl) to achieve the best S3 compatibility.
+# If set to 'false', s3api tries to use Swift ACLs (e.g. X-Container-Read)
+# instead of S3 ACLs as far as possible.
+# There are some caveats that one should know about this setting. Firstly,
+# if it is set to 'false' after previously being set to 'true', any objects or
+# containers stored while the setting was 'true' will be accessible to all
+# users, because their S3 ACLs will be ignored while s3_acl=False. Secondly,
+# s3_acl=True mode does not keep ACL consistency between the S3 and Swift
+# APIs: with s3_acl enabled, S3 ACLs only affect objects and buckets accessed
+# via the S3 API, as this ACL information is not available via the Swift API
+# and so will not be applied there.
+# Note that s3_acl currently supports only keystone and tempauth.
+# DON'T USE THIS in production before testing it thoroughly for your use
+# cases. This feature is still under development and it might cause
+# something you don't expect.
+# s3_acl = false
+#
+# Specify a (comma-separated) list of host names for your Swift cluster.
+# This enables virtual-hosted style requests.
+# storage_domain =
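+#
+# For example (hypothetical domain):
+# storage_domain = s3.example.com
+# would let clients send virtual-hosted style requests such as
+# bucket-name.s3.example.com.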
+#
+# Enable pipeline order check for SLO, s3token, authtoken, keystoneauth
+# according to standard s3api/Swift construction using either tempauth or
+# keystoneauth. If the order is incorrect, it raises an exception to stop
+# proxy. Turn auth_pipeline_check off only when you want to bypass these
+# authenticate middlewares in order to use other 3rd party (or your
+# proprietary) authenticate middleware.
+# auth_pipeline_check = True
+#
+# Enable multi-part uploads. (default: true)
+# This is required to store files larger than Swift's max_file_size (by
+# default, 5GiB). Note that this has performance implications when deleting
+# objects, as we now have to check whether there are also segments to delete.
+# The SLO middleware must be in the pipeline after s3api for this option to have
+# effect.
+# allow_multipart_uploads = True
+#
+# Set the maximum number of parts for the Upload Part operation (default: 1000).
+# When setting it larger than the default value in order to match the
+# S3 specification (which allows 10000), also increase max_manifest_segments
+# for the slo middleware.
+# max_upload_part_num = 1000
+#
+# Enable returning only buckets whose owner is the user who requested the
+# GET Service operation. (default: false)
+# If you want to enable the above feature, set this and s3_acl to true.
+# That might cause significant performance degradation, so only set this to
+# true if your service absolutely needs this feature.
+# If you set this to false, s3api returns all buckets.
+# check_bucket_owner = false
+#
+# By default, Swift reports only S3 style access logs
+# (e.g. PUT /bucket/object). If force_swift_request_proxy_log is set
+# to 'true', Swift will also output Swift style logs
+# (e.g. PUT /v1/account/container/object) in addition to the S3 style logs.
+# Note that requests will then be reported twice (s3api does not deduplicate
+# them), and the Swift style logs will also include the various subrequests
+# made to achieve S3 compatibility.
+# force_swift_request_proxy_log = false
+#
+# The AWS S3 documentation says that each part of a multipart upload, except
+# the last part, must be at least 5 MB.
+# min_segment_size = 5242880
+#
+# AWS allows clock skew up to 15 mins; note that older versions of swift/swift3
+# allowed at most 5 mins.
+# allowable_clock_skew = 900
+#
+# CORS preflight requests don't contain enough information for us to
+# identify the account that should be used for the real request, so
+# the allowed origins must be set cluster-wide. (default: blank; all
+# preflight requests will be denied)
+# cors_preflight_allow_origin =
+#
+# AWS will return a 503 Slow Down when clients are making too many requests,
+# but that can make client logs confusing if they only log/give metrics on
+# status ints. Turn this on to return 429 instead.
+# ratelimit_as_client_error = false
+
+# You can override the default log routing for this filter here:
+# log_name = s3api
+
+[filter:s3token]
+# s3token middleware authenticates with keystone using the s3 credentials
+# provided in the request header. Please put s3token between s3api
+# and keystoneauth if you're using keystoneauth.
+use = egg:swift#s3token
+
+# Prefix that will be prepended to the tenant to form the account
+reseller_prefix = AUTH_
+
+# By default, s3token will reject all invalid S3-style requests. Set this to
+# True to delegate that decision to downstream WSGI components. This may be
+# useful if there are multiple auth systems in the proxy pipeline.
+delay_auth_decision = False
+
+# Keystone server details. Note that this differs from how swift3 was
+# configured: in particular, the Keystone API version must be included.
+auth_uri = http://keystonehost:5000/v3
+
+# Connect/read timeout (in seconds) to use when communicating with Keystone
+http_timeout = 10.0
+
+# SSL-related options
+# insecure = False
+# certfile =
+# keyfile =
+
+# You can override the default log routing for this filter here:
+# log_name = s3token
+
+# Secrets may be cached to reduce latency for the client and load on Keystone.
+# This configures the duration that secrets may be cached; set to zero to
+# disable caching and prevent Swift from retrieving secrets from Keystone.
+# secret_cache_duration = 60
+# Note that caching is required to enable signed aws-chunked transfers.
+
+# Recent Keystone deployments require credentials similar to the authtoken
+# middleware; these credentials require access to the s3tokens endpoint.
+# Additionally, if secret caching is enabled, the credentials should have
+# access to view all project credentials.
+# auth_url = http://keystonehost:5000
+# auth_type = password
+# project_domain_id = default
+# project_name = service
+# user_domain_id = default
+# username = swift
+# password = password
 
 [filter:healthcheck]
 use = egg:swift#healthcheck
@@ -177,25 +826,32 @@ use = egg:swift#memcache
 # set log_name = cache
 # set log_facility = LOG_LOCAL0
 # set log_level = INFO
-# set log_headers = False
+# set log_headers = false
 # set log_address = /dev/log
+#
 # If not set here, the value for memcache_servers will be read from
 # memcache.conf (see memcache.conf-sample) or lacking that file, it will
 # default to the value below. You can specify multiple servers separated with
-# commas, as in: 10.1.2.3:11211,10.1.2.4:11211
+# commas, as in: 10.1.2.3:11211,10.1.2.4:11211 (IPv6 addresses must
+# follow rfc3986 section-3.2.2, i.e. [::1]:11211)
 # memcache_servers = 127.0.0.1:11211
 #
-# Sets how memcache values are serialized and deserialized:
-# 0 = older, insecure pickle serialization
-# 1 = json serialization but pickles can still be read (still insecure)
-# 2 = json serialization only (secure and the default)
-# If not set here, the value for memcache_serialization_support will be read
-# from /etc/swift/memcache.conf (see memcache.conf-sample).
-# To avoid an instant full cache flush, existing installations should
-# upgrade with 0, then set to 1 and reload, then after some time (24 hours)
-# set to 2 and reload.
-# In the future, the ability to use pickle serialization will be removed.
-# memcache_serialization_support = 2
+# Sets the maximum number of connections to each memcached server per worker
+# memcache_max_connections = 2
+#
+# How long (in seconds) without an error before a server's error count is
+# reset. This will also be how long before a server is reenabled after
+# suppression is triggered.  Set to 0 to disable error-limiting.
+# error_suppression_interval = 60.0
+#
+# How many errors can accumulate before a server is temporarily ignored.
+# error_suppression_limit = 10
+#
+# (Optional) Global toggle for TLS usage when communicating with
+# the caching servers.
+# tls_enabled =
+#
+# More options documented in memcache.conf-sample
 
 [filter:ratelimit]
 use = egg:swift#ratelimit
@@ -203,44 +859,91 @@ use = egg:swift#ratelimit
 # set log_name = ratelimit
 # set log_facility = LOG_LOCAL0
 # set log_level = INFO
-# set log_headers = False
+# set log_headers = false
 # set log_address = /dev/log
+#
 # clock_accuracy should represent how accurate the proxy servers' system clocks
 # are with each other. 1000 means that all the proxies' clock are accurate to
 # each other within 1 millisecond.  No ratelimit should be higher than the
 # clock accuracy.
 # clock_accuracy = 1000
+#
 # max_sleep_time_seconds = 60
+#
 # log_sleep_time_seconds of 0 means disabled
 # log_sleep_time_seconds = 0
+#
 # allows for slow rates (e.g. running up to 5 sec's behind) to catch up.
 # rate_buffer_seconds = 5
+#
 # account_ratelimit of 0 means disabled
 # account_ratelimit = 0
 
+# DEPRECATED- these will continue to work but will be replaced
+# by the X-Account-Sysmeta-Global-Write-Ratelimit flag.
+# Please see ratelimiting docs for details.
 # these are comma separated lists of account names
 # account_whitelist = a,b
 # account_blacklist = c,d
 
 # with container_limit_x = r
-# for containers of size x limit requests per second to r.  The container
+# for containers of size x limit write requests per second to r.  The container
 # rate will be linearly interpolated from the values given. With the values
 # below, a container of size 5 will get a rate of 75.
 # container_ratelimit_0 = 100
 # container_ratelimit_10 = 50
 # container_ratelimit_50 = 20
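+# For illustration, the linear interpolation above works out as:
+#   rate(5) = 100 + (50 - 100) * (5 - 0) / (10 - 0) = 75 requests/sec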
 
+# Similarly to the above container-level write limits, the following will limit
+# container GET (listing) requests.
+# container_listing_ratelimit_0 = 100
+# container_listing_ratelimit_10 = 50
+# container_listing_ratelimit_50 = 20
+
+[filter:read_only]
+use = egg:swift#read_only
+# Set read_only to true to turn global read-only mode on.
+# read_only = false
+# Set allow_deletes to true to allow deletes.
+# allow_deletes = false
+# Note: Put after ratelimit in the pipeline.
+
+# Note: needs to be placed before listing_formats;
+# otherwise remapped listings will always be JSON
 [filter:domain_remap]
 use = egg:swift#domain_remap
 # You can override the default log routing for this filter here:
 # set log_name = domain_remap
 # set log_facility = LOG_LOCAL0
 # set log_level = INFO
-# set log_headers = False
+# set log_headers = false
 # set log_address = /dev/log
+#
+# Specify the storage_domain that matches your cloud; multiple domains
+# can be specified, separated by commas
 # storage_domain = example.com
+
+# Specify a root path part that will be added to the start of paths if not
+# already present.
 # path_root = v1
+
+# Browsers can convert a host header to lowercase, so this middleware checks
+# that the reseller prefix on the account is the correct case. This is done by
+# comparing the items in the reseller_prefixes config option to the found
+# prefix. If they match except for case, the item from reseller_prefixes is
+# used instead of the found reseller prefix. When none match, the default
+# reseller prefix is used. When no default reseller prefix is configured, any
+# request with an account prefix not in that list is ignored by this
+# middleware.
 # reseller_prefixes = AUTH
+# default_reseller_prefix =
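+# For illustration, with storage_domain = example.com and the default
+# reseller_prefixes = AUTH, a request like
+#   c.a.example.com/o  ->  /v1/AUTH_a/c/o
+# (container c, account a, object o; the names here are placeholders)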
+
+# Enable legacy remapping behavior for versioned path requests:
+#   c.a.example.com/v1/o -> /v1/AUTH_a/c/o
+# instead of
+#   c.a.example.com/v1/o -> /v1/AUTH_a/c/v1/o
+# ... by default all path parts after a remapped domain are considered part of
+# the object name with no special case for the path "v1"
+# mangle_client_paths = False
 
 [filter:catch_errors]
 use = egg:swift#catch_errors
@@ -248,7 +951,7 @@ use = egg:swift#catch_errors
 # set log_name = catch_errors
 # set log_facility = LOG_LOCAL0
 # set log_level = INFO
-# set log_headers = False
+# set log_headers = false
 # set log_address = /dev/log
 
 [filter:cname_lookup]
@@ -258,35 +961,54 @@ use = egg:swift#cname_lookup
 # set log_name = cname_lookup
 # set log_facility = LOG_LOCAL0
 # set log_level = INFO
-# set log_headers = False
+# set log_headers = false
 # set log_address = /dev/log
+#
+# Specify the storage_domain that matches your cloud; multiple domains
+# can be specified, separated by commas
 # storage_domain = example.com
+#
 # lookup_depth = 1
+#
+# Specify the nameservers to use to do the CNAME resolution. If unset, the
+# system configuration is used. Multiple nameservers can be specified
+# separated by a comma. Default port 53 can be overridden. IPv6 is accepted.
+# Example: 127.0.0.1, 127.0.0.2, 127.0.0.3:5353, [::1], [::1]:5353
+# nameservers =
 
 # Note: Put staticweb just after your auth filter(s) in the pipeline
 [filter:staticweb]
 use = egg:swift#staticweb
-# Seconds to cache container x-container-meta-web-* header values.
-# cache_timeout = 300
 # You can override the default log routing for this filter here:
 # set log_name = staticweb
 # set log_facility = LOG_LOCAL0
 # set log_level = INFO
+# set log_headers = false
 # set log_address = /dev/log
-# set access_log_name = staticweb
-# set access_log_facility = LOG_LOCAL0
-# set access_log_level = INFO
-# set log_headers = False
+#
+# At times when it's impossible for staticweb to guess the outside
+# endpoint correctly, the url_base may be used to supply the URL
+# scheme and/or the host name (and port number) in order to generate
+# redirects.
+# Example values:
+#    http://www.example.com    - redirect to www.example.com
+#    https:                    - changes the scheme only
+#    https://                  - same, changes the scheme only
+#    //www.example.com:8080    - redirect www.example.com on port 8080
+#                                (scheme unchanged)
+# url_base =
 
-# Note: Put tempurl just before your auth filter(s) in the pipeline
+# Note: Put tempurl before dlo, slo and your auth filter(s) in the pipeline
 [filter:tempurl]
 use = egg:swift#tempurl
+# The methods allowed with Temp URLs.
+# methods = GET HEAD PUT POST DELETE
 #
 # The headers to remove from incoming requests. Simply a whitespace delimited
 # list of header names and names can optionally end with '*' to indicate a
 # prefix match. incoming_allow_headers is a list of exceptions to these
 # removals.
-# incoming_remove_headers = x-timestamp
+# incoming_remove_headers = x-timestamp x-open-expired
 #
 # The headers allowed as exceptions to incoming_remove_headers. Simply a
 # whitespace delimited list of header names and names can optionally end with
@@ -303,10 +1025,17 @@ use = egg:swift#tempurl
 # whitespace delimited list of header names and names can optionally end with
 # '*' to indicate a prefix match.
 # outgoing_allow_headers = x-object-meta-public-*
+#
+# The digest algorithm(s) supported for generating signatures;
+# whitespace-delimited.
+# allowed_digests = sha1 sha256 sha512
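+# For example, to stop accepting sha1 signatures you might restrict this to
+# the stronger digests only (illustrative, not the default):
+#   allowed_digests = sha256 sha512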
 
 # Note: Put formpost just before your auth filter(s) in the pipeline
 [filter:formpost]
 use = egg:swift#formpost
+# The digest algorithm(s) supported for generating signatures;
+# whitespace-delimited.
+# allowed_digests = sha1 sha256 sha512
 
 # Note: Just needs to be placed before the proxy-server in the pipeline.
 [filter:name_check]
@@ -315,6 +1044,26 @@ use = egg:swift#name_check
 # maximum_length = 255
 # forbidden_regexp = /\./|/\.\./|/\.$|/\.\.$
 
+# Note: Etag quoter should be placed just after cache in the pipeline.
+[filter:etag-quoter]
+use = egg:swift#etag_quoter
+# Historically, Swift has emitted bare MD5 hex digests as ETags, which is not
+# RFC compliant. With this middleware in the pipeline, users can opt-in to
+# RFC-compliant ETags on a per-account or per-container basis.
+#
+# Set to true to enable RFC-compliant ETags cluster-wide by default. Users
+# can still opt-out by setting appropriate account or container metadata.
+# enable_by_default = false
+
+[filter:list-endpoints]
+use = egg:swift#list_endpoints
+# list_endpoints_path = /endpoints/
+
+# Note: The double proxy-logging in the pipeline is not a mistake. The
+# left-most proxy-logging is there to log requests that were handled in
+# middleware and never made it through to the right-most middleware (and
+# proxy server). Double logging is prevented for normal requests. See
+# proxy-logging docs.
 [filter:proxy-logging]
 use = egg:swift#proxy_logging
 # If not set, logging directives from [DEFAULT] without "access_" will be used
@@ -322,15 +1071,354 @@ use = egg:swift#proxy_logging
 # access_log_facility = LOG_LOCAL0
 # access_log_level = INFO
 # access_log_address = /dev/log
+#
+# Log route for this filter. Useful if you want to have different configs for
+# the two proxy-logging filters.
+# access_log_route = proxy-server
+#
 # If set, access_log_udp_host will override access_log_address
 # access_log_udp_host =
 # access_log_udp_port = 514
+#
 # You can use log_statsd_* from [DEFAULT] or override them here:
-# access_log_statsd_host = localhost
+# access_log_statsd_host =
 # access_log_statsd_port = 8125
-# access_log_statsd_default_sample_rate = 1
+# access_log_statsd_default_sample_rate = 1.0
+# access_log_statsd_sample_rate_factor = 1.0
 # access_log_statsd_metric_prefix =
-# access_log_headers = False
+# access_log_headers = false
+#
+# If access_log_headers is true and access_log_headers_only is set, only
+# these headers are logged. Multiple headers can be defined as a comma-separated
+# list like this: access_log_headers_only = Host, X-Object-Meta-Mtime
+# access_log_headers_only =
+#
+# The default log format includes several sensitive values in logs:
+#   * X-Auth-Token header
+#   * temp_url_sig query parameter
+#   * Authorization header
+#   * X-Amz-Signature query parameter
+# To prevent an unauthorized access of the log file leading to an unauthorized
+# access of cluster data, only a portion of these values are written, with the
+# remainder replaced by '...' in the log. Set reveal_sensitive_prefix to the
+# number of characters to log.  Set to 0 to suppress the values entirely; set
+# to something large (1000, say) to write full values. Note that some values
+# may start appearing in full at values as low as 33.
+# reveal_sensitive_prefix = 16
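+# For illustration, with the default of 16 a (made-up) token value such as
+# AUTH_tk1234567890abcdef1234567890abcdef would be logged as
+# AUTH_tk123456789... (first 16 characters, remainder replaced by '...').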
+#
 # What HTTP methods are allowed for StatsD logging (comma-sep); request methods
 # not in this list will have "BAD_METHOD" for the <method> portion of the metric.
-# log_statsd_valid_http_methods = GET,HEAD,POST,PUT,DELETE,COPY,OPTIONS
+# log_statsd_valid_http_methods = GET,HEAD,POST,PUT,DELETE,COPY,OPTIONS,UPDATE
+#
+# Hashing algorithm for log anonymization. Must be one of the algorithms
+# supported by Python's hashlib.
+# log_anonymization_method = MD5
+#
+# Salt added during log anonymization
+# log_anonymization_salt =
+#
+# Template used to format access logs. All words surrounded by curly brackets
+# will be substituted with the appropriate values. For more information, see
+# https://docs.openstack.org/swift/latest/logs.html
+# log_msg_template = {client_ip} {remote_addr} {end_time.datetime} {method} {path} {protocol} {status_int} {referer} {user_agent} {auth_token} {bytes_recvd} {bytes_sent} {client_etag} {transaction_id} {headers} {request_time} {source} {log_info} {start_time} {end_time} {policy_index} {access_user_id}
+# The proxy_logging middleware attempts to translate s3api request paths to
+# swift paths. To do so it needs to know which, if any, storage domains are
+# configured for virtual-hosted style requests. This option should be a
+# comma-separated list of host names, exactly the same as that set for the
+# s3api middleware.
+# storage_domain =
+#
+# A float value in seconds for how often the proxy server should emit statsd
+# real-time buffer transfer bytes counter metrics for WSGI input or output.
+# A negative value disables these metrics; 0 emits them on every input or
+# output call. Default is -1.
+# statsd_emit_buffer_xfer_bytes_seconds = -1
+#
+# Note: Put before both ratelimit and auth in the pipeline.
+[filter:bulk]
+use = egg:swift#bulk
+# max_containers_per_extraction = 10000
+# max_failed_extractions = 1000
+# max_deletes_per_request = 10000
+# max_failed_deletes = 1000
+#
+# In order to keep a connection active during a potentially long bulk request,
+# Swift may return whitespace prepended to the actual response body. This
+# whitespace will be yielded no more than every yield_frequency seconds.
+# yield_frequency = 10
+#
+# Note: The following parameter is used during a bulk delete of objects and
+# their container. Such a delete would frequently fail because it is very
+# likely that not all replicated objects have been deleted by the time the
+# middleware got a successful response, so the number of retries can be
+# configured here. The wait between retries is 1.5**retry seconds.
+# delete_container_retry_count = 0
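+# For illustration (assuming the retry counter starts at 1), with
+# delete_container_retry_count = 3 the waits between retries would be
+# 1.5**1 = 1.5s, 1.5**2 = 2.25s and 1.5**3 = 3.375s.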
+#
+# To speed up the bulk delete process, multiple deletes may be executed in
+# parallel. Avoid setting this too high, as it gives clients a force multiplier
+# which may be used in DoS attacks. The suggested range is between 2 and 10.
+# delete_concurrency = 2
+
+# Note: Put after auth and staticweb in the pipeline.
+[filter:slo]
+use = egg:swift#slo
+# max_manifest_segments = 1000
+# max_manifest_size = 8388608
+#
+# Rate limiting applies only to segments smaller than this size (bytes).
+# rate_limit_under_size = 1048576
+#
+# Start rate-limiting SLO segment serving after the Nth small segment of a
+# segmented object.
+# rate_limit_after_segment = 10
+#
+# Once segment rate-limiting kicks in for an object, limit segments served
+# to N per second. 0 means no rate-limiting.
+# rate_limit_segments_per_sec = 1
+#
+# Time limit on GET requests (seconds)
+# max_get_time = 86400
+#
+# When creating an SLO, multiple segment validations may be executed in
+# parallel. Further, multiple deletes may be executed in parallel when deleting
+# with ?multipart-manifest=delete. Use this setting to limit how many
+# subrequests may be executed concurrently. Avoid setting it too high, as it
+# gives clients a force multiplier which may be used in DoS attacks. The
+# suggested range is between 2 and 10.
+# concurrency = 2
+#
+# This may be used to separately tune validation and delete concurrency values.
+# Default is to use the concurrency value from above; all of the same caveats
+# apply regarding recommended ranges.
+# delete_concurrency = 2
+#
+# In order to keep a connection active during a potentially long PUT request,
+# clients may request that Swift send whitespace ahead of the final response
+# body. This whitespace will be yielded at most every yield_frequency seconds.
+# yield_frequency = 10
+#
+# Since SLOs may have thousands of segments, clients may request that the
+# object-expirer handle the deletion of segments using query params like
+# `?multipart-manifest=delete&async=on`. You may want to keep this off if it
+# negatively impacts your expirers; in that case, the deletes will still
+# be done as part of the client request.
+# allow_async_delete = true
+
+# Note: Put after auth and staticweb in the pipeline.
+# If you don't put it in the pipeline, it will be inserted for you.
+[filter:dlo]
+use = egg:swift#dlo
+# Start rate-limiting DLO segment serving after the Nth segment of a
+# segmented object.
+# rate_limit_after_segment = 10
+#
+# Once segment rate-limiting kicks in for an object, limit segments served
+# to N per second. 0 means no rate-limiting.
+# rate_limit_segments_per_sec = 1
+#
+# Time limit on GET requests (seconds)
+# max_get_time = 86400
+
+# Note: Put after auth and server-side copy in the pipeline.
+[filter:container-quotas]
+use = egg:swift#container_quotas
+
+# Note: Put after auth and server-side copy in the pipeline.
+[filter:account-quotas]
+use = egg:swift#account_quotas
+
+[filter:gatekeeper]
+use = egg:swift#gatekeeper
+# Set this to false if you want to allow clients to set arbitrary X-Timestamps
+# on uploaded objects. This may be used to preserve timestamps when migrating
+# from a previous storage system, but risks allowing users to upload
+# difficult-to-delete data.
+# shunt_inbound_x_timestamp = true
+#
+# Set this to true if you want to allow clients to access and manipulate the
+# (normally internal-to-swift) null namespace by including a header like
+#    X-Allow-Reserved-Names: true
+# allow_reserved_names_header = false
+#
+# You can override the default log routing for this filter here:
+# set log_name = gatekeeper
+# set log_facility = LOG_LOCAL0
+# set log_level = INFO
+# set log_headers = false
+# set log_address = /dev/log
+
+[filter:container_sync]
+use = egg:swift#container_sync
+# Set this to false if you want to disallow any full URL values to be set for
+# any new X-Container-Sync-To headers. This will keep any new full URLs from
+# coming in, but won't change any existing values already in the cluster.
+# Updating those will have to be done manually, as knowing what the true realm
+# endpoint should be cannot always be guessed.
+# allow_full_urls = true
+# Set this to specify this cluster's //realm/cluster as "current" in /info
+# current = //REALM/CLUSTER
+
+# Note: Put it at the beginning of the pipeline to profile all middleware. But
+# it is safer to put this after catch_errors, gatekeeper and healthcheck.
+# Not intended for production environments!
+[filter:xprofile]
+use = egg:swift#xprofile
+# This option enables you to switch profilers; the profiler should inherit
+# from the Python standard profiler. Currently supported values include
+# 'cProfile' and 'eventlet.green.profile'.
+# profile_module = eventlet.green.profile
+#
+# This prefix will be used to combine process ID and timestamp to name the
+# profile data file.  Make sure the executing user has permission to write
+# into this path (missing path segments will be created, if necessary).
+# If you enable profiling in more than one type of daemon, you must override
+# it with a unique value like: /var/log/swift/profile/proxy.profile
+# log_filename_prefix = /tmp/log/swift/profile/default.profile
+#
+# The profile data will be dumped to local disk based on the above naming rule
+# at this interval (in seconds).
+# dump_interval = 5.0
+#
+# Be careful: this option makes the profiler dump data into timestamped files,
+# which means lots of files will pile up in the directory.
+# dump_timestamp = false
+#
+# This is the path of the URL to access the mini web UI.
+# path = /__profile__
+#
+# Clear the data when the wsgi server shuts down.
+# flush_at_shutdown = false
+#
+# unwind the iterator of applications
+# unwind = false
+
+# Note: Put after slo, dlo in the pipeline.
+# If you don't put it in the pipeline, it will be inserted automatically.
+[filter:versioned_writes]
+use = egg:swift#versioned_writes
+# Enables using versioned writes middleware and exposing configuration
+# settings via HTTP GET /info.
+# WARNING: Setting this option bypasses the "allow_versions" option
+# in the container configuration file, which will eventually be
+# deprecated. See documentation for more details.
+# allow_versioned_writes = false
+# Enables Swift object-versioning API
+# allow_object_versioning = false
+
+# Note: Put after auth and before dlo and slo middlewares.
+# If you don't put it in the pipeline, it will be inserted for you.
+[filter:copy]
+use = egg:swift#copy
+
+# Note: To enable encryption, add the following 2 dependent pieces of crypto
+# middleware to the proxy-server pipeline. They should be to the right of all
+# other middleware apart from the final proxy-logging middleware, and in the
+# order shown in this example:
+#  keymaster encryption proxy-logging proxy-server
+[filter:keymaster]
+use = egg:swift#keymaster
+
+# Over time, the format of crypto metadata on disk may change slightly to resolve
+# ambiguities. In general, you want to be writing the newest version, but to
+# ensure that all writes can still be read during rolling upgrades, there's the
+# option to write older formats as well.
+# Before upgrading from Swift 2.20.0 or Swift 2.19.1 or earlier, ensure this is set to 1
+# Before upgrading from Swift 2.25.0 or earlier, ensure this is set to at most 2
+# After upgrading all proxy servers, set this to 3 (currently the highest version)
+#
+# The default is currently 2 to support upgrades with no configuration changes,
+# but may change to 3 in the future.
+meta_version_to_write = 2
+
+# Sets the root secret from which encryption keys are derived. This must be set
+# before first use to a value that is a base64 encoding of at least 32 bytes.
+# The security of all encrypted data critically depends on this key, therefore
+# it should be set to a high-entropy value. For example, a suitable value may
+# be obtained by base-64 encoding a 32 byte (or longer) value generated by a
+# cryptographically secure random number generator. Changing the root secret is
+# likely to result in data loss.
+encryption_root_secret = changeme
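+# For example, one possible way (among others) to generate such a value is:
+#   openssl rand -base64 32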
+
+# Multiple root secrets may be configured using options named
+# 'encryption_root_secret_<secret_id>' where 'secret_id' is a unique
+# identifier. This enables the root secret to be changed from time to time.
+# Only one root secret is used for object PUTs or POSTs at any moment in time.
+# This is specified by the 'active_root_secret_id' option. If
+# 'active_root_secret_id' is not specified then the root secret specified by
+# 'encryption_root_secret' is considered to be the default. Once a root secret
+# has been used as the default root secret it must remain in the config file in
+# order that any objects that were encrypted with it may be subsequently
+# decrypted. The secret_id used to identify the key cannot change.
+# encryption_root_secret_myid = changeme
+# active_root_secret_id = myid
+
+# Sets the path from which the keymaster config options should be read. This
+# allows multiple processes which need to be encryption-aware (for example,
+# proxy-server and container-sync) to share the same config file, ensuring
+# that the encryption keys used are the same. The format expected is similar
+# to other config files, with a single [keymaster] section and a single
+# encryption_root_secret option. If this option is set, the root secret
+# MUST NOT be set in proxy-server.conf.
+# keymaster_config_path =
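+# For illustration, such an external file (e.g. /etc/swift/keymaster.conf;
+# the path is an example) might contain just:
+#   [keymaster]
+#   encryption_root_secret = changeme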
+
+# To store the encryption root secret in a remote key management system (KMS)
+# such as Barbican, replace the keymaster middleware with the kms_keymaster
+# middleware in the proxy-server pipeline. They should be to the right of all
+# other middleware apart from the final proxy-logging middleware, and in the
+# order shown in this example:
+#  kms_keymaster encryption proxy-logging proxy-server
+[filter:kms_keymaster]
+use = egg:swift#kms_keymaster
+
+# Sets the path from which the keymaster config options should be read. This
+# allows multiple processes which need to be encryption-aware (for example,
+# proxy-server and container-sync) to share the same config file, ensuring
+# that the encryption keys used are the same. The format expected is similar
+# to other config files, with a single [kms_keymaster] section. See the
+# keymaster.conf-sample file for details on the kms_keymaster configuration
+# options.
+# keymaster_config_path =
+
+# kmip_keymaster middleware may be used to fetch an encryption root secret from
+# a KMIP service. It should replace, in the same position, any other keymaster
+# middleware in the proxy-server pipeline, so that the middleware order is as
+# shown in this example:
+#  kmip_keymaster encryption proxy-logging proxy-server
+[filter:kmip_keymaster]
+use = egg:swift#kmip_keymaster
+
+# Sets the path from which the keymaster config options should be read. This
+# allows multiple processes which need to be encryption-aware (for example,
+# proxy-server and container-sync) to share the same config file, ensuring
+# that the encryption keys used are the same. As an added benefit the
+# keymaster configuration file can have different permissions than the
+# `proxy-server.conf` file. The format expected is similar
+# to other config files, with a single [kmip_keymaster] section. See the
+# keymaster.conf-sample file for details on the kmip_keymaster configuration
+# options.
+# keymaster_config_path =
+
+[filter:encryption]
+use = egg:swift#encryption
+
+# By default all PUT or POST'ed object data and/or metadata will be encrypted.
+# Encryption of new data and/or metadata may be disabled by setting
+# disable_encryption to True. However, all encryption middleware should remain
+# in the pipeline in order for existing encrypted data to be read.
+# disable_encryption = False
+
+# listing_formats should be just right of the first proxy-logging middleware,
+# and left of most other middlewares. If it is not already present, it will
+# be automatically inserted for you.
+[filter:listing_formats]
+use = egg:swift#listing_formats
+
+# Note: Put after slo, dlo, versioned_writes, but before encryption in the
+# pipeline.
+[filter:symlink]
+use = egg:swift#symlink
+# Symlinks can point to other symlinks provided the number of symlinks in a
+# chain does not exceed the symloop_max value. If the number of chained
+# symlinks exceeds the limit symloop_max a 409 (HTTPConflict) error
+# response will be produced.
+# symloop_max = 2
diff --git a/etc/rsyncd.conf-sample b/etc/rsyncd.conf-sample
index c3b9952b16..00d205e1dc 100644
--- a/etc/rsyncd.conf-sample
+++ b/etc/rsyncd.conf-sample
@@ -2,6 +2,9 @@ uid = swift
 gid = swift
 log file = /var/log/rsyncd.log
 pid file = /var/run/rsyncd.pid
+# Since the rsync default for reverse lookup is true, you have to set it to
+# false here globally, or after a few hundred nodes your DNS team will fuss at you.
+reverse lookup = false
 
 [account]
 max connections = 2
@@ -20,3 +23,59 @@ max connections = 8
 path = /srv/node
 read only = false
 lock file = /var/lock/object.lock
+
+
+# If rsync_module includes the device, you can tune rsyncd to permit 4
+# connections per device instead of simply allowing 8 connections for all
+# devices:
+# rsync_module = {replication_ip}::object_{device}
+#
+# (if devices in your object ring are named sda, sdb and sdc)
+#
+#[object_sda]
+#max connections = 4
+#path = /srv/node
+#read only = false
+#lock file = /var/lock/object_sda.lock
+#
+#[object_sdb]
+#max connections = 4
+#path = /srv/node
+#read only = false
+#lock file = /var/lock/object_sdb.lock
+#
+#[object_sdc]
+#max connections = 4
+#path = /srv/node
+#read only = false
+#lock file = /var/lock/object_sdc.lock
+
+
+# On a swift-all-in-one VM, you might tune rsync by replication port instead:
+# rsync_module = {replication_ip}::object{replication_port}
+#
+# So, on your SAIO, you have to set the following rsyncd configuration:
+#
+#[object6210]
+#max connections = 25
+#path = /srv/1/node/
+#read only = false
+#lock file = /var/lock/object6210.lock
+#
+#[object6220]
+#max connections = 25
+#path = /srv/2/node/
+#read only = false
+#lock file = /var/lock/object6220.lock
+#
+#[object6230]
+#max connections = 25
+#path = /srv/3/node/
+#read only = false
+#lock file = /var/lock/object6230.lock
+#
+#[object6240]
+#max connections = 25
+#path = /srv/4/node/
+#read only = false
+#lock file = /var/lock/object6240.lock
diff --git a/etc/swift-bench.conf-sample b/etc/swift-bench.conf-sample
deleted file mode 100644
index 423608ec48..0000000000
--- a/etc/swift-bench.conf-sample
+++ /dev/null
@@ -1,60 +0,0 @@
-[bench]
-# auth = http://localhost:8080/auth/v1.0
-# user = test:tester
-# key = testing
-# auth_version = 1.0
-# log-level = INFO
-# timeout = 10
-
-# You can configure PUT, GET, and DELETE concurrency independently or set all
-# three with "concurrency"
-# put_concurrency = 10
-# get_concurrency = 10
-# del_concurrency = 10
-# concurrency =
-
-# A space-sep list of files whose contents will be read and randomly chosen
-# as the body (object contents) for each PUT.
-# object_sources =
-
-# If object_sources is not set and lower_object_size != upper_object_size,
-# each PUT will randomly select an object size between the two values.  Units
-# are bytes.
-# lower_object_size = 10
-# upper_object_size = 10
-
-# If object_sources is not set and lower_object_size == upper_object_size,
-# every object PUT will contain this many bytes.
-# object_size = 1
-
-# num_objects = 1000
-# num_gets = 10000
-# num_containers = 20
-
-# The base name for created containers.
-# container_name = (randomly-chosen uuid4)
-
-# Should swift-bench benchmark DELETEing the created objects and then delete
-# all created containers?
-# delete = yes
-
-# Without use_proxy, swift-bench will talk directly to the backend Swift
-# servers.  Doing that will require "url", "account", and at least one
-# "devices" entry.
-# use_proxy = yes
-
-# If use_proxy = yes, this will override any returned X-Storage-Url returned
-# by authenticaion (the account name will still be extracted from
-# X-Storage-Url though and may NOT be set with the "account" conf var).  If
-# use_proxy = no, this setting is required and used as the X-Storage-Url when
-# deleting containers and as a source for IP and port for back-end Swift server
-# connections.  The IP and port specified in this setting must have local
-# storage access to every device specified in "devices".
-# url =
-
-# Only used (and required) when use_proxy = no.
-# account =
-
-# A space-sep list of devices names; only relevant (and required) when
-# use_proxy = no.
-# devices = sdb1
diff --git a/etc/swift-rsyslog.conf-sample b/etc/swift-rsyslog.conf-sample
new file mode 100644
index 0000000000..4d9c2f3ea1
--- /dev/null
+++ b/etc/swift-rsyslog.conf-sample
@@ -0,0 +1,40 @@
+# Uncomment the following to have a log containing all logs together
+#local.* /var/log/swift/all.log
+
+# Uncomment the following to have hourly swift logs.
+#$template HourlyProxyLog,"/var/log/swift/hourly/%$YEAR%%$MONTH%%$DAY%%$HOUR%"
+#local0.* ?HourlyProxyLog
+
+# Use the following to have separate log files for each of the main servers:
+# account-server, container-server, object-server, proxy-server. Note:
+# object-updater's output will be stored in object.log.
+if $programname contains 'swift' then /var/log/swift/swift.log
+if $programname contains 'account' then /var/log/swift/account.log
+if $programname contains 'container' then /var/log/swift/container.log
+if $programname contains 'object' then /var/log/swift/object.log
+if $programname contains 'proxy' then /var/log/swift/proxy.log
+
+# Uncomment the following to have specific log via program name.
+#if $programname == 'swift' then /var/log/swift/swift.log
+#if $programname == 'account-server' then /var/log/swift/account-server.log
+#if $programname == 'account-replicator' then /var/log/swift/account-replicator.log
+#if $programname == 'account-auditor' then /var/log/swift/account-auditor.log
+#if $programname == 'account-reaper' then /var/log/swift/account-reaper.log
+#if $programname == 'container-server' then /var/log/swift/container-server.log
+#if $programname == 'container-replicator' then /var/log/swift/container-replicator.log
+#if $programname == 'container-updater' then /var/log/swift/container-updater.log
+#if $programname == 'container-auditor' then /var/log/swift/container-auditor.log
+#if $programname == 'container-sync' then /var/log/swift/container-sync.log
+#if $programname == 'container-sharder' then /var/log/swift/container-sharder.log
+#if $programname == 'container-reconciler' then /var/log/swift/container-reconciler.log
+#if $programname == 'object-server' then /var/log/swift/object-server.log
+#if $programname == 'object-replicator' then /var/log/swift/object-replicator.log
+#if $programname == 'object-updater' then /var/log/swift/object-updater.log
+#if $programname == 'object-auditor' then /var/log/swift/object-auditor.log
+#if $programname == 'object-expirer' then /var/log/swift/object-expirer.log
+#if $programname == 'object-reconstructor' then /var/log/swift/object-reconstructor.log
+#if $programname == 'object-relinker' then /var/log/swift/object-relinker.log
+
+# Use the following to discard logs that don't match any of the above to avoid
+# them filling up /var/log/messages.
+local0.* ~
diff --git a/etc/swift.conf-sample b/etc/swift.conf-sample
index 2f4192a3c1..84454ec4f8 100644
--- a/etc/swift.conf-sample
+++ b/etc/swift.conf-sample
@@ -1,15 +1,116 @@
 [swift-hash]
 
-# swift_hash_path_suffix is used as part of the hashing algorithm
-# when determining data placement in the cluster. This value should
-# remain secret and MUST NOT change once a cluster has been deployed.
+# swift_hash_path_suffix and swift_hash_path_prefix are used as part of the
+# hashing algorithm when determining data placement in the cluster.
+# These values should remain secret and MUST NOT change
+# once a cluster has been deployed.
+# Use only printable chars (python -c "import string; print(string.printable)")
 
 swift_hash_path_suffix = changeme
-
-
+swift_hash_path_prefix = changeme
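+# For example, one possible way (among others) to generate suitable random
+# values is:
+#   python -c "import secrets; print(secrets.token_hex(32))"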
+
+# Storage policies are defined here and determine various characteristics
+# about how objects are stored and treated. More documentation can be found at
+# https://docs.openstack.org/swift/latest/overview_policies.html.
+
+# Client requests specify a policy on a per container basis using the policy
+# name. Internally the policy name is mapped to the policy index specified in
+# the policy's section header in this config file. Policy names are
+# case-insensitive and, to avoid confusion with indexes names, should not be
+# numbers.
+#
+# The policy with index 0 is always used for legacy containers and can be given
+# a name for use in metadata however the ring file name will always be
+# 'object.ring.gz' for backwards compatibility.  If no policies are defined a
+# policy with index 0 will be automatically created for backwards compatibility
+# and given the name Policy-0.  A default policy is used when creating new
+# containers when no policy is specified in the request.  If no other policies
+# are defined the policy with index 0 will be declared the default.  If
+# multiple policies are defined you must define a policy with index 0 and you
+# must specify a default.  It is recommended you always define a section for
+# storage-policy:0.
+#
+# A 'policy_type' argument is also supported but is not mandatory.  Default
+# policy type 'replication' is used when 'policy_type' is unspecified.
+#
+# A 'diskfile_module' optional argument lets you specify an alternate backend
+# object storage plug-in architecture. The default is
+# "egg:swift#replication.fs", or "egg:swift#erasure_coding.fs", depending on
+# the policy type.
+#
+# Aliases for the storage policy name may be defined, but are not required.
+#
+[storage-policy:0]
+name = Policy-0
+default = yes
+#policy_type = replication
+#diskfile_module = egg:swift#replication.fs
+aliases = yellow, orange
+
+# The following section would declare a policy called 'silver', the number of
+# replicas will be determined by how the ring is built.  In this example the
+# 'silver' policy could have a lower or higher # of replicas than the
+# 'Policy-0' policy above.  The ring filename will be 'object-1.ring.gz'.  You
+# may only specify one storage policy section as the default.  If you change
+# this section to specify 'silver' as the default, when a client creates a new
+# container without a policy specified, it will get the 'silver' policy because
+# this config has specified it as the default.  However if a legacy container
+# (one created with a pre-policy version of swift) is accessed, it is known
+# implicitly to be assigned to the policy with index 0 as opposed to the
+# current default. Note that even without specifying any aliases, a policy
+# always has at least the default name stored in aliases because this field is
+# used to contain all human readable names for a storage policy.
+#
+#[storage-policy:1]
+#name = silver
+#policy_type = replication
+#diskfile_module = egg:swift#replication.fs
+
+# The following declares a storage policy of type 'erasure_coding' which uses
+# Erasure Coding for data reliability. Please refer to Swift documentation for
+# details on how the 'erasure_coding' storage policy is implemented.
+#
+# Swift uses PyECLib, a Python Erasure coding API library, for encode/decode
+# operations.  Please refer to Swift documentation for details on how to
+# install PyECLib.
+#
+# When defining an EC policy, 'policy_type' needs to be 'erasure_coding' and
+# EC configuration parameters 'ec_type', 'ec_num_data_fragments' and
+# 'ec_num_parity_fragments' must be specified.  'ec_type' is chosen from the
+# list of EC backends supported by PyECLib.  The ring configured for the
+# storage policy must have its "replica" count configured to
+# 'ec_num_data_fragments' + 'ec_num_parity_fragments' - this requirement is
+# validated when services start.  'ec_object_segment_size' is the amount of
+# data that will be buffered up before feeding a segment into the
+# encoder/decoder.  More information about these configuration options and
+# supported 'ec_type' schemes is available in the Swift documentation.  See
+# https://docs.openstack.org/swift/latest/overview_erasure_code.html
+# for more information on how to configure EC policies.
+#
+# The example 'deepfreeze10-4' policy defined below is a _sample_
+# configuration with an alias of 'df10-4' as well as 10 'data' and 4 'parity'
+# fragments. 'ec_type' defines the Erasure Coding scheme.
+# 'liberasurecode_rs_vand' (Reed-Solomon Vandermonde) is used as an example
+# below.
+#
+#[storage-policy:2]
+#name = deepfreeze10-4
+#aliases = df10-4
+#policy_type = erasure_coding
+#diskfile_module = egg:swift#erasure_coding.fs
+#ec_type = liberasurecode_rs_vand
+#ec_num_data_fragments = 10
+#ec_num_parity_fragments = 4
+#ec_object_segment_size = 1048576
+#
+# EC fragment duplication is proof-of-concept, experimental support to enable
+# Global Erasure Coding policies with multiple regions acting as independent
+# failure domains.  Do not change the default except in development/testing.
+#ec_duplication_factor = 1
 
 # The swift-constraints section sets the basic constraints on data
-# saved in the swift cluster.
+# saved in the swift cluster. These constraints are automatically
+# published by the proxy server in responses to /info requests.
 
 [swift-constraints]
 
@@ -46,6 +147,35 @@ swift_hash_path_suffix = changeme
 
 #max_meta_overall_size = 4096
 
+# max_header_size is the max number of bytes in the utf8 encoding of each
+# header. The default is 8192 because eventlet uses 8192 as the max size of a
+# header line. This value may need to be increased when using identity
+# v3 API tokens that include more than 7 catalog entries.
+# See also include_service_catalog in proxy-server.conf-sample
+# (documented at https://docs.openstack.org/swift/latest/overview_auth.html)
+
+#max_header_size = 8192
+
+
+# max_request_line constrains the max number of characters in the request
+# line; a request line '<method> <path> <version>\r\n' must have fewer
+# than this number of characters.
+# The default is 8192 because eventlet uses 8192 as its default max request line.
+#
+# Note: Request urls are concatenated with the request method to form
+# the Referer header that is sent to backend servers, so it may be
+# necessary to increase max_header_size when increasing max_request_line.
+
+#max_request_line = 8192
+
+# By default the maximum number of allowed headers depends on the number of max
+# allowed metadata settings plus a default value of 36 for swift internally
+# generated headers and regular http headers.  If for some reason this is not
+# enough (custom middleware for example) it can be increased with the
+# extra_header_count constraint.
+
+#extra_header_count = 0
+
 
 # max_object_name_length is the max number of bytes in the utf8 encoding
 # of an object name
@@ -74,3 +204,19 @@ swift_hash_path_suffix = changeme
 # of a container name
 
 #max_container_name_length = 256
+
+
+# By default all REST API calls should use "v1" or "v1.0" as the version string,
+# for example "/v1/account". This can be manually overridden to make this
+# backward-compatible, in case a different version string has been used before.
+# Use a comma-separated list in case of multiple allowed versions, for example
+# valid_api_versions = v0,v1,v2
+# This is only enforced for account, container and object requests. The allowed
+# api versions are by default excluded from /info.
+
+# valid_api_versions = v1,v1.0
+
+# The prefix used for hidden auto-created accounts, for example accounts in
+# which shard containers are created. It defaults to '.'; don't change it.
+
+# auto_create_account_prefix = .
diff --git a/examples/apache2/account-server.template b/examples/apache2/account-server.template
new file mode 100644
index 0000000000..d336a130d8
--- /dev/null
+++ b/examples/apache2/account-server.template
@@ -0,0 +1,25 @@
+# Account Server VHOST Template For Apache2
+#
+# Change %PORT% to the port that you wish to use on your system
+# Change %SERVICENAME% to the service name you are using
+# Change %USER% to the system user that will run the daemon process
+# Change the debug level as you see fit
+#
+# For example:
+#     Replace %PORT% by 6212
+#     Replace %SERVICENAME% by account-server-1
+#     Replace %USER% with apache (or remove it for default)
+
+NameVirtualHost *:%PORT%
+Listen %PORT%
+
+<VirtualHost *:%PORT%>
+    WSGIDaemonProcess %SERVICENAME% processes=5 threads=1 user=%USER% display-name=%{GROUP}
+    WSGIProcessGroup %SERVICENAME%
+    WSGIScriptAlias / /var/www/swift/%SERVICENAME%.wsgi
+    WSGIApplicationGroup %{GLOBAL}
+    LimitRequestFields 200
+    ErrorLog /var/log/%APACHE_NAME%/%SERVICENAME%
+    LogLevel debug
+    CustomLog /var/log/%APACHE_NAME%/access.log combined
+</VirtualHost>
diff --git a/examples/apache2/container-server.template b/examples/apache2/container-server.template
new file mode 100644
index 0000000000..5b504b1958
--- /dev/null
+++ b/examples/apache2/container-server.template
@@ -0,0 +1,25 @@
+# Container Server VHOST Template For Apache2
+#
+# Change %PORT% to the port that you wish to use on your system
+# Change %SERVICENAME% to the service name you are using
+# Change %USER% to the system user that will run the daemon process
+# Change the debug level as you see fit
+#
+# For example:
+#     Replace %PORT% by 6211
+#     Replace %SERVICENAME% by container-server-1
+#     Replace %USER% with apache (or remove it for default)
+
+NameVirtualHost *:%PORT%
+Listen %PORT%
+
+<VirtualHost *:%PORT%>
+    WSGIDaemonProcess %SERVICENAME% processes=5 threads=1 user=%USER% display-name=%{GROUP}
+    WSGIProcessGroup %SERVICENAME%
+    WSGIScriptAlias / /var/www/swift/%SERVICENAME%.wsgi
+    WSGIApplicationGroup %{GLOBAL}
+    LimitRequestFields 200
+    ErrorLog /var/log/%APACHE_NAME%/%SERVICENAME%
+    LogLevel debug
+    CustomLog /var/log/%APACHE_NAME%/access.log combined
+</VirtualHost>
diff --git a/examples/apache2/object-server.template b/examples/apache2/object-server.template
new file mode 100644
index 0000000000..8e8ed65670
--- /dev/null
+++ b/examples/apache2/object-server.template
@@ -0,0 +1,25 @@
+# Object Server VHOST Template For Apache2
+#
+# Change %PORT% to the port that you wish to use on your system
+# Change %SERVICENAME% to the service name you are using
+# Change %USER% to the system user that will run the daemon process
+# Change the debug level as you see fit
+#
+# For example:
+#     Replace %PORT% by 6210
+#     Replace %SERVICENAME% by object-server-1
+#     Replace %USER% with apache (or remove it for default)
+
+NameVirtualHost *:%PORT%
+Listen %PORT%
+
+<VirtualHost *:%PORT%>
+    WSGIDaemonProcess %SERVICENAME% processes=5 threads=1 user=%USER% display-name=%{GROUP}
+    WSGIProcessGroup %SERVICENAME%
+    WSGIScriptAlias / /var/www/swift/%SERVICENAME%.wsgi
+    WSGIApplicationGroup %{GLOBAL}
+    LimitRequestFields 200
+    ErrorLog /var/log/%APACHE_NAME%/%SERVICENAME%
+    LogLevel debug
+    CustomLog /var/log/%APACHE_NAME%/access.log combined
+</VirtualHost>
diff --git a/examples/apache2/proxy-server.template b/examples/apache2/proxy-server.template
new file mode 100644
index 0000000000..f2b500be65
--- /dev/null
+++ b/examples/apache2/proxy-server.template
@@ -0,0 +1,27 @@
+# Proxy Server VHOST Template For Apache2
+#
+# Change %PORT% to the port that you wish to use on your system
+# Change %SERVICENAME% to the service name you are using
+# Change %USER% to the system user that will run the daemon process
+# Change the debug level as you see fit
+#
+# For example:
+#     Replace %PORT% by 8080
+#     Replace %SERVICENAME% by proxy-server
+#     Replace %USER% with apache (or remove it for default)
+
+NameVirtualHost *:%PORT%
+Listen %PORT%
+
+<VirtualHost *:%PORT%>
+    # The limit of an object size
+    LimitRequestBody 5368709122
+    WSGIDaemonProcess %SERVICENAME% processes=5 threads=1 user=%USER% display-name=%{GROUP}
+    WSGIProcessGroup %SERVICENAME%
+    WSGIScriptAlias / /var/www/swift/%SERVICENAME%.wsgi
+    WSGIApplicationGroup %{GLOBAL}
+    LimitRequestFields 200
+    ErrorLog /var/log/%APACHE_NAME%/%SERVICENAME%
+    LogLevel debug
+    CustomLog /var/log/%APACHE_NAME%/access.log combined
+</VirtualHost>
diff --git a/examples/wsgi/account-server.wsgi.template b/examples/wsgi/account-server.wsgi.template
new file mode 100644
index 0000000000..51bcc00d92
--- /dev/null
+++ b/examples/wsgi/account-server.wsgi.template
@@ -0,0 +1,14 @@
+# Account Server wsgi Template
+#
+# Change %SERVICECONF% to the service conf file you are using
+#
+# For example:
+#     Replace %SERVICECONF% by account-server/1.conf
+#
+# This file then needs to be saved under /var/www/swift/%SERVICENAME%.wsgi
+# * Replace %SERVICENAME% with the service name you use on your system
+#   E.g. Replace %SERVICENAME% by account-server-1
+
+from swift.common.wsgi import init_request_processor
+application, conf, logger, log_name = \
+    init_request_processor('/etc/swift/%SERVICECONF%','account-server')
diff --git a/examples/wsgi/container-server.wsgi.template b/examples/wsgi/container-server.wsgi.template
new file mode 100644
index 0000000000..bebd3e6a41
--- /dev/null
+++ b/examples/wsgi/container-server.wsgi.template
@@ -0,0 +1,14 @@
+# Container Server wsgi Template
+#
+# Change %SERVICECONF% to the service conf file you are using
+#
+# For example:
+#     Replace %SERVICECONF% by container-server/1.conf
+#
+# This file then needs to be saved under /var/www/swift/%SERVICENAME%.wsgi
+# * Replace %SERVICENAME% with the service name you use on your system
+#   E.g. Replace %SERVICENAME% by container-server-1
+
+from swift.common.wsgi import init_request_processor
+application, conf, logger, log_name = \
+    init_request_processor('/etc/swift/%SERVICECONF%','container-server')
diff --git a/examples/wsgi/object-server.wsgi.template b/examples/wsgi/object-server.wsgi.template
new file mode 100644
index 0000000000..afcb14324c
--- /dev/null
+++ b/examples/wsgi/object-server.wsgi.template
@@ -0,0 +1,14 @@
+# Object Server wsgi Template
+#
+# Change %SERVICECONF% to the service conf file you are using
+#
+# For example:
+#     Replace %SERVICECONF% by object-server/1.conf
+#
+# This file then needs to be saved under /var/www/swift/%SERVICENAME%.wsgi
+# * Replace %SERVICENAME% with the service name you use on your system
+#   E.g. Replace %SERVICENAME% by object-server-1
+
+from swift.common.wsgi import init_request_processor
+application, conf, logger, log_name = \
+    init_request_processor('/etc/swift/%SERVICECONF%','object-server')
diff --git a/examples/wsgi/proxy-server.wsgi.template b/examples/wsgi/proxy-server.wsgi.template
new file mode 100644
index 0000000000..1a48afeca6
--- /dev/null
+++ b/examples/wsgi/proxy-server.wsgi.template
@@ -0,0 +1,14 @@
+# Proxy Server wsgi Template
+#
+# Change %SERVICECONF% to the service conf file you are using
+#
+# For example:
+#     Replace %SERVICECONF% by proxy-server.conf
+#
+# This file then needs to be saved under /var/www/swift/%SERVICENAME%.wsgi
+# * Replace %SERVICENAME% with the service name you use on your system
+#   E.g. Replace %SERVICENAME% by proxy-server
+
+from swift.common.wsgi import init_request_processor
+application, conf, logger, log_name = \
+    init_request_processor('/etc/swift/%SERVICECONF%','proxy-server')
diff --git a/locale/swift.pot b/locale/swift.pot
deleted file mode 100644
index 7f905f2940..0000000000
--- a/locale/swift.pot
+++ /dev/null
@@ -1,1030 +0,0 @@
-# Translations template for swift.
-# Copyright (C) 2011 ORGANIZATION
-# This file is distributed under the same license as the swift project.
-# FIRST AUTHOR , 2011.
-#
-#, fuzzy
-msgid ""
-msgstr ""
-"Project-Id-Version: swift 1.2.0\n"
-"Report-Msgid-Bugs-To: EMAIL@ADDRESS\n"
-"POT-Creation-Date: 2011-01-26 23:59+0000\n"
-"PO-Revision-Date: YEAR-MO-DA HO:MI+ZONE\n"
-"Last-Translator: FULL NAME \n"
-"Language-Team: LANGUAGE \n"
-"MIME-Version: 1.0\n"
-"Content-Type: text/plain; charset=utf-8\n"
-"Content-Transfer-Encoding: 8bit\n"
-"Generated-By: Babel 0.9.4\n"
-
-#: swift/account/auditor.py:52 swift/account/auditor.py:75
-#, python-format
-msgid ""
-"Since %(time)s: Account audits: %(passed)s passed audit, %(failed)s "
-"failed audit"
-msgstr ""
-
-#: swift/account/auditor.py:100 swift/container/auditor.py:103
-#, python-format
-msgid "Audit passed for %s"
-msgstr ""
-
-#: swift/account/auditor.py:103
-#, python-format
-msgid "ERROR Could not get account info %s"
-msgstr ""
-
-#: swift/account/reaper.py:80 swift/container/updater.py:64
-#, python-format
-msgid "Loading account ring from %s"
-msgstr ""
-
-#: swift/account/reaper.py:88 swift/obj/updater.py:57
-#, python-format
-msgid "Loading container ring from %s"
-msgstr ""
-
-#: swift/account/reaper.py:96
-#, python-format
-msgid "Loading object ring from %s"
-msgstr ""
-
-#: swift/account/reaper.py:106
-msgid "Daemon started."
-msgstr ""
-
-#: swift/account/reaper.py:122
-#, python-format
-msgid "Begin devices pass: %s"
-msgstr ""
-
-#: swift/account/reaper.py:128 swift/common/utils.py:805
-#: swift/obj/updater.py:74 swift/obj/updater.py:113
-#, python-format
-msgid "Skipping %s as it is not mounted"
-msgstr ""
-
-#: swift/account/reaper.py:132
-#, python-format
-msgid "Devices pass completed: %.02fs"
-msgstr ""
-
-#: swift/account/reaper.py:215
-#, python-format
-msgid "Beginning pass on account %s"
-msgstr ""
-
-#: swift/account/reaper.py:238
-#, python-format
-msgid "Exception with containers for account %s"
-msgstr ""
-
-#: swift/account/reaper.py:243
-#, python-format
-msgid "Exception with account %s"
-msgstr ""
-
-#: swift/account/reaper.py:244
-#, python-format
-msgid "Incomplete pass on account %s"
-msgstr ""
-
-#: swift/account/reaper.py:246
-#, python-format
-msgid ", %s containers deleted"
-msgstr ""
-
-#: swift/account/reaper.py:248
-#, python-format
-msgid ", %s objects deleted"
-msgstr ""
-
-#: swift/account/reaper.py:250
-#, python-format
-msgid ", %s containers remaining"
-msgstr ""
-
-#: swift/account/reaper.py:253
-#, python-format
-msgid ", %s objects remaining"
-msgstr ""
-
-#: swift/account/reaper.py:255
-#, python-format
-msgid ", %s containers possibly remaining"
-msgstr ""
-
-#: swift/account/reaper.py:258
-#, python-format
-msgid ", %s objects possibly remaining"
-msgstr ""
-
-#: swift/account/reaper.py:261
-msgid ", return codes: "
-msgstr ""
-
-#: swift/account/reaper.py:265
-#, python-format
-msgid ", elapsed: %.02fs"
-msgstr ""
-
-#: swift/account/reaper.py:320 swift/account/reaper.py:355
-#: swift/account/reaper.py:406 swift/container/updater.py:277
-#, python-format
-msgid "Exception with %(ip)s:%(port)s/%(device)s"
-msgstr ""
-
-#: swift/account/reaper.py:333
-#, python-format
-msgid "Exception with objects for container %(container)s for account %(account)s"
-msgstr ""
-
-#: swift/account/server.py:309 swift/container/server.py:397
-#: swift/obj/server.py:597
-#, python-format
-msgid "ERROR __call__ error with %(method)s %(path)s "
-msgstr ""
-
-#: swift/auth/server.py:96 swift/common/middleware/swauth.py:94
-msgid "No super_admin_key set in conf file! Exiting."
-msgstr ""
-
-#: swift/auth/server.py:152
-#, python-format
-msgid ""
-"\n"
-"THERE ARE ACCOUNTS IN YOUR auth.db THAT DO NOT BEGIN WITH YOUR NEW "
-"RESELLER\n"
-"PREFIX OF \"%(reseller)s\".\n"
-"YOU HAVE A FEW OPTIONS:\n"
-"    1. RUN \"swift-auth-update-reseller-prefixes %(db_file)s "
-"%(reseller)s\",\n"
-"       \"swift-init auth-server restart\", AND\n"
-"       \"swift-auth-recreate-accounts -K ...\" TO CREATE FRESH ACCOUNTS.\n"
-"    OR\n"
-"    2. REMOVE %(db_file)s, RUN \"swift-init auth-server restart\", AND "
-"RUN\n"
-"       \"swift-auth-add-user ...\" TO CREATE BRAND NEW ACCOUNTS THAT WAY."
-"\n"
-"    OR\n"
-"    3. ADD \"reseller_prefix = %(previous)s\" (WITHOUT THE QUOTES) TO "
-"YOUR\n"
-"       proxy-server.conf IN THE [filter:auth] SECTION AND TO YOUR\n"
-"       auth-server.conf IN THE [app:auth-server] SECTION AND RUN\n"
-"       \"swift-init proxy-server restart\" AND \"swift-init auth-server "
-"restart\"\n"
-"       TO REVERT BACK TO YOUR PREVIOUS RESELLER PREFIX.\n"
-"\n"
-"    %(note)s\n"
-"                    "
-msgstr ""
-
-#: swift/auth/server.py:173
-msgid ""
-"\n"
-"    SINCE YOUR PREVIOUS RESELLER PREFIX WAS AN EMPTY STRING, IT IS NOT\n"
-"    RECOMMENDED TO PERFORM OPTION 3 AS THAT WOULD MAKE SUPPORTING "
-"MULTIPLE\n"
-"    RESELLERS MORE DIFFICULT.\n"
-"                    "
-msgstr ""
-
-#: swift/auth/server.py:178
-msgid "CRITICAL: "
-msgstr ""
-
-#: swift/auth/server.py:213
-#, python-format
-msgid "ERROR attempting to create account %(url)s: %(status)s %(reason)s"
-msgstr ""
-
-#: swift/auth/server.py:346
-#, python-format
-msgid ""
-"ALREADY EXISTS create_user(%(account)s, %(user)s, _, %(admin)s, "
-"%(reseller_admin)s) [%(elapsed).02f]"
-msgstr ""
-
-#: swift/auth/server.py:364
-#, python-format
-msgid ""
-"FAILED create_user(%(account)s, %(user)s, _, %(admin)s, "
-"%(reseller_admin)s) [%(elapsed).02f]"
-msgstr ""
-
-#: swift/auth/server.py:381
-#, python-format
-msgid ""
-"SUCCESS create_user(%(account)s, %(user)s, _, %(admin)s, "
-"%(reseller_admin)s) = %(url)s [%(elapsed).02f]"
-msgstr ""
-
-#: swift/auth/server.py:656
-msgid "ERROR Unhandled exception in ReST request"
-msgstr ""
-
-#: swift/common/bench.py:85
-#, python-format
-msgid "%(complete)s %(title)s [%(fail)s failures], %(rate).01f/s"
-msgstr ""
-
-#: swift/common/bench.py:97
-msgid "CannotSendRequest.  Skipping..."
-msgstr ""
-
-#: swift/common/bufferedhttp.py:96
-#, python-format
-msgid "HTTP PERF: %(time).5f seconds to %(method)s %(host)s:%(port)s %(path)s)"
-msgstr ""
-
-#: swift/common/db.py:299
-msgid "Broker error trying to rollback locked connection"
-msgstr ""
-
-#: swift/common/db.py:754 swift/common/db.py:1221
-#, python-format
-msgid "Invalid pending entry %(file)s: %(entry)s"
-msgstr ""
-
-#: swift/common/db_replicator.py:84
-#, python-format
-msgid "ERROR reading HTTP response from %s"
-msgstr ""
-
-#: swift/common/db_replicator.py:123
-#, python-format
-msgid "Attempted to replicate %(count)d dbs in %(time).5f seconds (%(rate).5f/s)"
-msgstr ""
-
-#: swift/common/db_replicator.py:129
-#, python-format
-msgid "Removed %(remove)d dbs"
-msgstr ""
-
-#: swift/common/db_replicator.py:130
-#, python-format
-msgid "%(success)s successes, %(failure)s failures"
-msgstr ""
-
-#: swift/common/db_replicator.py:155
-#, python-format
-msgid "ERROR rsync failed with %(code)s: %(args)s"
-msgstr ""
-
-#: swift/common/db_replicator.py:205
-#, python-format
-msgid "Syncing chunks with %s"
-msgstr ""
-
-#: swift/common/db_replicator.py:213
-#, python-format
-msgid "ERROR Bad response %(status)s from %(host)s"
-msgstr ""
-
-#: swift/common/db_replicator.py:278
-#, python-format
-msgid "ERROR Unable to connect to remote server: %s"
-msgstr ""
-
-#: swift/common/db_replicator.py:316
-#, python-format
-msgid "Replicating db %s"
-msgstr ""
-
-#: swift/common/db_replicator.py:325 swift/common/db_replicator.py:479
-#, python-format
-msgid "Quarantining DB %s"
-msgstr ""
-
-#: swift/common/db_replicator.py:328
-#, python-format
-msgid "ERROR reading db %s"
-msgstr ""
-
-#: swift/common/db_replicator.py:361
-#, python-format
-msgid "ERROR Remote drive not mounted %s"
-msgstr ""
-
-#: swift/common/db_replicator.py:363
-#, python-format
-msgid "ERROR syncing %(file)s with node %(node)s"
-msgstr ""
-
-#: swift/common/db_replicator.py:405
-msgid "ERROR Failed to get my own IPs?"
-msgstr ""
-
-#: swift/common/db_replicator.py:412
-#, python-format
-msgid "Skipping %(device)s as it is not mounted"
-msgstr ""
-
-#: swift/common/db_replicator.py:420
-msgid "Beginning replication run"
-msgstr ""
-
-#: swift/common/db_replicator.py:425
-msgid "Replication run OVER"
-msgstr ""
-
-#: swift/common/db_replicator.py:436
-msgid "ERROR trying to replicate"
-msgstr ""
-
-#: swift/common/memcached.py:69
-#, python-format
-msgid "Timeout %(action)s to memcached: %(server)s"
-msgstr ""
-
-#: swift/common/memcached.py:72
-#, python-format
-msgid "Error %(action)s to memcached: %(server)s"
-msgstr ""
-
-#: swift/common/memcached.py:81
-#, python-format
-msgid "Error limiting server %s"
-msgstr ""
-
-#: swift/common/utils.py:88
-#, python-format
-msgid "Unable to locate %s in libc.  Leaving as a no-op."
-msgstr ""
-
-#: swift/common/utils.py:255
-msgid "STDOUT: Connection reset by peer"
-msgstr ""
-
-#: swift/common/utils.py:257 swift/common/utils.py:260
-#, python-format
-msgid "STDOUT: %s"
-msgstr ""
-
-#: swift/common/utils.py:324
-msgid "Connection refused"
-msgstr ""
-
-#: swift/common/utils.py:326
-msgid "Host unreachable"
-msgstr ""
-
-#: swift/common/utils.py:328
-msgid "Connection timeout"
-msgstr ""
-
-#: swift/common/utils.py:464
-msgid "UNCAUGHT EXCEPTION"
-msgstr ""
-
-#: swift/common/utils.py:511
-msgid "Error: missing config file argument"
-msgstr ""
-
-#: swift/common/utils.py:516
-#, python-format
-msgid "Error: unable to locate %s"
-msgstr ""
-
-#: swift/common/utils.py:743
-#, python-format
-msgid "Unable to read config file %s"
-msgstr ""
-
-#: swift/common/utils.py:749
-#, python-format
-msgid "Unable to find %s config section in %s"
-msgstr ""
-
-#: swift/common/middleware/catch_errors.py:39
-#, python-format
-msgid "Error: %s"
-msgstr ""
-
-#: swift/common/middleware/cname_lookup.py:91
-#, python-format
-msgid "Mapped %(given_domain)s to %(found_domain)s"
-msgstr ""
-
-#: swift/common/middleware/cname_lookup.py:102
-#, python-format
-msgid "Following CNAME chain for  %(given_domain)s to %(found_domain)s"
-msgstr ""
-
-#: swift/common/middleware/ratelimit.py:172
-msgid "Returning 497 because of blacklisting"
-msgstr ""
-
-#: swift/common/middleware/ratelimit.py:185
-#, python-format
-msgid "Ratelimit sleep log: %(sleep)s for %(account)s/%(container)s/%(object)s"
-msgstr ""
-
-#: swift/common/middleware/ratelimit.py:192
-#, python-format
-msgid "Returning 498 because of ops rate limiting (Max Sleep) %s"
-msgstr ""
-
-#: swift/common/middleware/ratelimit.py:212
-msgid "Warning: Cannot ratelimit without a memcached client"
-msgstr ""
-
-#: swift/common/middleware/swauth.py:635
-#, python-format
-msgid ""
-"ERROR: Exception while trying to communicate with "
-"%(scheme)s://%(host)s:%(port)s/%(path)s"
-msgstr ""
-
-#: swift/container/auditor.py:54 swift/container/auditor.py:78
-#, python-format
-msgid ""
-"Since %(time)s: Container audits: %(pass)s passed audit, %(fail)s failed "
-"audit"
-msgstr ""
-
-#: swift/container/auditor.py:68
-msgid "Begin container audit \"once\" mode"
-msgstr ""
-
-#: swift/container/auditor.py:88
-#, python-format
-msgid "Container audit \"once\" mode completed: %.02fs"
-msgstr ""
-
-#: swift/container/auditor.py:106
-#, python-format
-msgid "ERROR Could not get container info %s"
-msgstr ""
-
-#: swift/container/server.py:114
-#, python-format
-msgid ""
-"ERROR Account update failed with %(ip)s:%(port)s/%(device)s (will retry "
-"later): Response %(status)s %(reason)s"
-msgstr ""
-
-#: swift/container/server.py:122
-#, python-format
-msgid ""
-"ERROR account update failed with %(ip)s:%(port)s/%(device)s (will retry "
-"later)"
-msgstr ""
-
-#: swift/container/updater.py:78 swift/obj/replicator.py:492
-#, python-format
-msgid "%s is not mounted"
-msgstr ""
-
-#: swift/container/updater.py:97
-#, python-format
-msgid "ERROR with loading suppressions from %s: "
-msgstr ""
-
-#: swift/container/updater.py:107
-msgid "Begin container update sweep"
-msgstr ""
-
-#: swift/container/updater.py:140
-#, python-format
-msgid ""
-"Container update sweep of %(path)s completed: %(elapsed).02fs, "
-"%(success)s successes, %(fail)s failures, %(no_change)s with no changes"
-msgstr ""
-
-#: swift/container/updater.py:154
-#, python-format
-msgid "Container update sweep completed: %.02fs"
-msgstr ""
-
-#: swift/container/updater.py:164
-msgid "Begin container update single threaded sweep"
-msgstr ""
-
-#: swift/container/updater.py:172
-#, python-format
-msgid ""
-"Container update single threaded sweep completed: %(elapsed).02fs, "
-"%(success)s successes, %(fail)s failures, %(no_change)s with no changes"
-msgstr ""
-
-#: swift/container/updater.py:224
-#, python-format
-msgid "Update report sent for %(container)s %(dbfile)s"
-msgstr ""
-
-#: swift/container/updater.py:232
-#, python-format
-msgid "Update report failed for %(container)s %(dbfile)s"
-msgstr ""
-
-#: swift/container/updater.py:266
-#, python-format
-msgid ""
-"ERROR account update failed with %(ip)s:%(port)s/%(device)s (will retry "
-"later): "
-msgstr ""
-
-#: swift/obj/auditor.py:61
-#, python-format
-msgid "Begin object audit \"%s\" mode"
-msgstr ""
-
-#: swift/obj/auditor.py:73
-#, python-format
-msgid ""
-"Since %(start_time)s: Locally: %(passes)d passed audit, %(quars)d "
-"quarantined, %(errors)d errors files/sec: %(frate).2f , bytes/sec: "
-"%(brate).2f"
-msgstr ""
-
-#: swift/obj/auditor.py:90
-#, python-format
-msgid ""
-"Object audit \"%(mode)s\" mode completed: %(elapsed).02fs. Total "
-"files/sec: %(frate).2f , Total bytes/sec: %(brate).2f "
-msgstr ""
-
-#: swift/obj/auditor.py:141
-#, python-format
-msgid "ERROR Object %(obj)s failed audit and will be quarantined: %(err)s"
-msgstr ""
-
-#: swift/obj/auditor.py:150
-#, python-format
-msgid "ERROR Trying to audit %s"
-msgstr ""
-
-#: swift/obj/replicator.py:182
-msgid "Error hashing suffix"
-msgstr ""
-
-#: swift/obj/replicator.py:246
-#, python-format
-msgid "Killing long-running rsync: %s"
-msgstr ""
-
-#: swift/obj/replicator.py:257
-#, python-format
-msgid "Bad rsync return code: %(args)s -> %(ret)d"
-msgstr ""
-
-#: swift/obj/replicator.py:261 swift/obj/replicator.py:265
-#, python-format
-msgid "Successful rsync of %(src)s at %(dst)s (%(time).03f)"
-msgstr ""
-
-#: swift/obj/replicator.py:350
-#, python-format
-msgid "Removing partition: %s"
-msgstr ""
-
-#: swift/obj/replicator.py:353
-msgid "Error syncing handoff partition"
-msgstr ""
-
-#: swift/obj/replicator.py:383
-#, python-format
-msgid "%(ip)s/%(device)s responded as unmounted"
-msgstr ""
-
-#: swift/obj/replicator.py:388
-#, python-format
-msgid "Invalid response %(resp)s from %(ip)s"
-msgstr ""
-
-#: swift/obj/replicator.py:410
-#, python-format
-msgid "Error syncing with node: %s"
-msgstr ""
-
-#: swift/obj/replicator.py:414
-msgid "Error syncing partition"
-msgstr ""
-
-#: swift/obj/replicator.py:424
-#, python-format
-msgid ""
-"%(replicated)d/%(total)d (%(percentage).2f%%) partitions replicated in "
-"%(time).2fs (%(rate).2f/sec, %(remaining)s remaining)"
-msgstr ""
-
-#: swift/obj/replicator.py:433
-#, python-format
-msgid ""
-"%(checked)d suffixes checked - %(hashed).2f%% hashed, %(synced).2f%% "
-"synced"
-msgstr ""
-
-#: swift/obj/replicator.py:439
-#, python-format
-msgid "Partition times: max %(max).4fs, min %(min).4fs, med %(med).4fs"
-msgstr ""
-
-#: swift/obj/replicator.py:446
-#, python-format
-msgid "Nothing replicated for %s seconds."
-msgstr ""
-
-#: swift/obj/replicator.py:475
-msgid "Lockup detected.. killing live coros."
-msgstr ""
-
-#: swift/obj/replicator.py:530
-msgid "Ring change detected. Aborting current replication pass."
-msgstr ""
-
-#: swift/obj/replicator.py:540
-msgid "Exception in top-level replication loop"
-msgstr ""
-
-#: swift/obj/replicator.py:549
-msgid "Running object replicator in script mode."
-msgstr ""
-
-#: swift/obj/replicator.py:553 swift/obj/replicator.py:565
-#, python-format
-msgid "Object replication complete. (%.02f minutes)"
-msgstr ""
-
-#: swift/obj/replicator.py:560
-msgid "Starting object replication pass."
-msgstr ""
-
-#: swift/obj/replicator.py:566
-#, python-format
-msgid "Replication sleeping for %s seconds."
-msgstr ""
-
-#: swift/obj/server.py:313
-#, python-format
-msgid ""
-"ERROR Container update failed (saving for async update later): %(status)d"
-" response from %(ip)s:%(port)s/%(dev)s"
-msgstr ""
-
-#: swift/obj/server.py:319
-#, python-format
-msgid ""
-"ERROR container update failed with %(ip)s:%(port)s/%(dev)s (saving for "
-"async update later)"
-msgstr ""
-
-#: swift/obj/updater.py:65
-msgid "Begin object update sweep"
-msgstr ""
-
-#: swift/obj/updater.py:89
-#, python-format
-msgid ""
-"Object update sweep of %(device)s completed: %(elapsed).02fs, %(success)s"
-" successes, %(fail)s failures"
-msgstr ""
-
-#: swift/obj/updater.py:98
-#, python-format
-msgid "Object update sweep completed: %.02fs"
-msgstr ""
-
-#: swift/obj/updater.py:105
-msgid "Begin object update single threaded sweep"
-msgstr ""
-
-#: swift/obj/updater.py:117
-#, python-format
-msgid ""
-"Object update single threaded sweep completed: %(elapsed).02fs, "
-"%(success)s successes, %(fail)s failures"
-msgstr ""
-
-#: swift/obj/updater.py:157
-#, python-format
-msgid "ERROR Pickle problem, quarantining %s"
-msgstr ""
-
-#: swift/obj/updater.py:177
-#, python-format
-msgid "Update sent for %(obj)s %(path)s"
-msgstr ""
-
-#: swift/obj/updater.py:182
-#, python-format
-msgid "Update failed for %(obj)s %(path)s"
-msgstr ""
-
-#: swift/obj/updater.py:206
-#, python-format
-msgid "ERROR with remote server %(ip)s:%(port)s/%(device)s"
-msgstr ""
-
-#: swift/proxy/server.py:165 swift/proxy/server.py:629
-#: swift/proxy/server.py:696 swift/proxy/server.py:712
-#: swift/proxy/server.py:721 swift/proxy/server.py:1004
-#: swift/proxy/server.py:1044 swift/proxy/server.py:1089
-msgid "Object"
-msgstr ""
-
-#: swift/proxy/server.py:170
-#, python-format
-msgid "Could not load object segment %(path)s: %(status)s"
-msgstr ""
-
-#: swift/proxy/server.py:177 swift/proxy/server.py:210
-#: swift/proxy/server.py:257
-#, python-format
-msgid "ERROR: While processing manifest /%(acc)s/%(cont)s/%(obj)s"
-msgstr ""
-
-#: swift/proxy/server.py:292
-#, python-format
-msgid "%(msg)s %(ip)s:%(port)s"
-msgstr ""
-
-#: swift/proxy/server.py:304
-#, python-format
-msgid "ERROR with %(type)s server %(ip)s:%(port)s/%(device)s re: %(info)s"
-msgstr ""
-
-#: swift/proxy/server.py:328
-#, python-format
-msgid "Node error limited %(ip)s:%(port)s (%(device)s)"
-msgstr ""
-
-#: swift/proxy/server.py:388 swift/proxy/server.py:1451
-#: swift/proxy/server.py:1497 swift/proxy/server.py:1545
-#: swift/proxy/server.py:1590
-msgid "Account"
-msgstr ""
-
-#: swift/proxy/server.py:389
-#, python-format
-msgid "Trying to get account info for %s"
-msgstr ""
-
-#: swift/proxy/server.py:466 swift/proxy/server.py:740
-#: swift/proxy/server.py:772 swift/proxy/server.py:1214
-#: swift/proxy/server.py:1301 swift/proxy/server.py:1356
-#: swift/proxy/server.py:1413
-msgid "Container"
-msgstr ""
-
-#: swift/proxy/server.py:467
-#, python-format
-msgid "Trying to get container info for %s"
-msgstr ""
-
-#: swift/proxy/server.py:552
-#, python-format
-msgid "%(type)s returning 503 for %(statuses)s"
-msgstr ""
-
-#: swift/proxy/server.py:598 swift/proxy/server.py:697
-#, python-format
-msgid "Trying to %(method)s %(path)s"
-msgstr ""
-
-#: swift/proxy/server.py:627
-msgid "Client disconnected on read"
-msgstr ""
-
-#: swift/proxy/server.py:630
-#, python-format
-msgid "Trying to read during GET of %s"
-msgstr ""
-
-#: swift/proxy/server.py:653
-#, python-format
-msgid "ERROR %(status)d %(body)s From %(type)s Server"
-msgstr ""
-
-#: swift/proxy/server.py:692
-#, python-format
-msgid "ERROR %(status)d %(body)s From Object Server"
-msgstr ""
-
-#: swift/proxy/server.py:776 swift/proxy/server.py:783
-#, python-format
-msgid "Object manifest GET could not continue listing: %s %s"
-msgstr ""
-
-#: swift/proxy/server.py:905
-msgid "Object POST"
-msgstr ""
-
-#: swift/proxy/server.py:1005
-#, python-format
-msgid "Expect: 100-continue on %s"
-msgstr ""
-
-#: swift/proxy/server.py:1017
-#, python-format
-msgid "Object PUT returning 503, %(conns)s/%(nodes)s required connections"
-msgstr ""
-
-#: swift/proxy/server.py:1045
-#, python-format
-msgid "Trying to write to %s"
-msgstr ""
-
-#: swift/proxy/server.py:1049
-#, python-format
-msgid ""
-"Object PUT exceptions during send, %(conns)s/%(nodes)s required "
-"connections"
-msgstr ""
-
-#: swift/proxy/server.py:1058
-#, python-format
-msgid "ERROR Client read timeout (%ss)"
-msgstr ""
-
-#: swift/proxy/server.py:1063
-msgid "ERROR Exception causing client disconnect"
-msgstr ""
-
-#: swift/proxy/server.py:1068
-msgid "Client disconnected without sending enough data"
-msgstr ""
-
-#: swift/proxy/server.py:1083
-#, python-format
-msgid "ERROR %(status)d %(body)s From Object Server re: %(path)s"
-msgstr ""
-
-#: swift/proxy/server.py:1090
-#, python-format
-msgid "Trying to get final status of PUT to %s"
-msgstr ""
-
-#: swift/proxy/server.py:1093
-#, python-format
-msgid "Object servers returned %s mismatched etags"
-msgstr ""
-
-#: swift/proxy/server.py:1101
-msgid "Object PUT"
-msgstr ""
-
-#: swift/proxy/server.py:1153
-msgid "Object DELETE"
-msgstr ""
-
-#: swift/proxy/server.py:1302 swift/proxy/server.py:1498
-#, python-format
-msgid "Trying to PUT to %s"
-msgstr ""
-
-#: swift/proxy/server.py:1314
-msgid "Container PUT"
-msgstr ""
-
-#: swift/proxy/server.py:1357 swift/proxy/server.py:1546
-#, python-format
-msgid "Trying to POST %s"
-msgstr ""
-
-#: swift/proxy/server.py:1369
-msgid "Container POST"
-msgstr ""
-
-#: swift/proxy/server.py:1414 swift/proxy/server.py:1591
-#, python-format
-msgid "Trying to DELETE %s"
-msgstr ""
-
-#: swift/proxy/server.py:1426
-msgid "Container DELETE"
-msgstr ""
-
-#: swift/proxy/server.py:1433
-msgid "Returning 503 because not all container nodes confirmed DELETE"
-msgstr ""
-
-#: swift/proxy/server.py:1508
-msgid "Account PUT"
-msgstr ""
-
-#: swift/proxy/server.py:1556
-msgid "Account POST"
-msgstr ""
-
-#: swift/proxy/server.py:1601
-msgid "Account DELETE"
-msgstr ""
-
-#: swift/proxy/server.py:1757
-msgid "ERROR Unhandled exception in request"
-msgstr ""
-
-#: swift/stats/access_processor.py:63 swift/stats/stats_processor.py:40
-#, python-format
-msgid "Bad line data: %s"
-msgstr ""
-
-#: swift/stats/access_processor.py:67
-#, python-format
-msgid "Bad server name: found \"%(found)s\" expected \"%(expected)s\""
-msgstr ""
-
-#: swift/stats/access_processor.py:75
-#, python-format
-msgid "Invalid path: %(error)s from data: %(log)s"
-msgstr ""
-
-#: swift/stats/access_processor.py:199
-#, python-format
-msgid "I found a bunch of bad lines in %(name)s (%(bad)d bad, %(total)d total)"
-msgstr ""
-
-#: swift/stats/account_stats.py:55
-msgid "Gathering account stats"
-msgstr ""
-
-#: swift/stats/account_stats.py:59
-#, python-format
-msgid "Gathering account stats complete (%0.2f minutes)"
-msgstr ""
-
-#: swift/stats/account_stats.py:75
-#, python-format
-msgid "Device %s is not mounted, skipping."
-msgstr ""
-
-#: swift/stats/account_stats.py:81
-#, python-format
-msgid "Path %s does not exist, skipping."
-msgstr ""
-
-#: swift/stats/log_processor.py:62
-#, python-format
-msgid "Loaded plugin \"%s\""
-msgstr ""
-
-#: swift/stats/log_processor.py:79
-#, python-format
-msgid "Processing %(obj)s with plugin \"%(plugin)s\""
-msgstr ""
-
-#: swift/stats/log_processor.py:179
-#, python-format
-msgid "Bad compressed data for %s"
-msgstr ""
-
-#: swift/stats/log_processor.py:240
-msgid "Beginning log processing"
-msgstr ""
-
-#: swift/stats/log_processor.py:278
-#, python-format
-msgid "found %d processed files"
-msgstr ""
-
-#: swift/stats/log_processor.py:283
-#, python-format
-msgid "loaded %d files to process"
-msgstr ""
-
-#: swift/stats/log_processor.py:286 swift/stats/log_processor.py:360
-#, python-format
-msgid "Log processing done (%0.2f minutes)"
-msgstr ""
-
-#: swift/stats/log_uploader.py:71
-msgid "Uploading logs"
-msgstr ""
-
-#: swift/stats/log_uploader.py:74
-#, python-format
-msgid "Uploading logs complete (%0.2f minutes)"
-msgstr ""
-
-#: swift/stats/log_uploader.py:129
-#, python-format
-msgid "Unexpected log: %s"
-msgstr ""
-
-#: swift/stats/log_uploader.py:135
-#, python-format
-msgid "Skipping log: %(file)s (< %(cutoff)d seconds old)"
-msgstr ""
-
-#: swift/stats/log_uploader.py:142
-#, python-format
-msgid "Log %s is 0 length, skipping"
-msgstr ""
-
-#: swift/stats/log_uploader.py:144
-#, python-format
-msgid "Processing log: %s"
-msgstr ""
-
-#: swift/stats/log_uploader.py:165
-#, python-format
-msgid "Uploaded log %(file)s to %(target)s"
-msgstr ""
-
-#: swift/stats/log_uploader.py:170
-#, python-format
-msgid "ERROR: Upload of log %s failed!"
-msgstr ""
-
diff --git a/lower-constraints.txt b/lower-constraints.txt
new file mode 100644
index 0000000000..ee9acd4d94
--- /dev/null
+++ b/lower-constraints.txt
@@ -0,0 +1,81 @@
+alabaster==0.7.10
+asn1crypto==0.24.0
+attrs==21.4.0
+Babel==2.5.3
+bandit==1.1.0
+boto==2.32.1
+boto3==1.9
+botocore==1.12
+castellan==0.13.0
+certifi==2018.1.18
+cffi==1.11.5
+chardet==3.0.4
+cliff==2.11.0
+cmd2==0.8.1
+coverage==5.2.1
+cryptography==2.0.2
+debtcollector==1.19.0
+dnspython==1.15.0
+docutils==0.15
+dulwich==0.19.0
+enum-compat==0.0.2
+eventlet==0.25.0
+extras==1.0.0
+fixtures==3.0.0
+future==0.16.0
+gitdb2==2.0.3
+GitPython==2.1.8
+greenlet==0.4.14
+idna==2.6
+imagesize==1.0.0
+iso8601==0.1.12
+Jinja2==2.10
+keystoneauth1==3.4.0
+keystonemiddleware==4.17.0
+linecache2==1.0.0
+lxml==4.2.3
+MarkupSafe==1.0
+mock==3.0
+monotonic==1.4
+msgpack==0.5.6
+netaddr==0.7.19
+netifaces==0.10.4
+oslo.config==5.2.0
+oslo.i18n==3.20.0
+oslo.log==3.22.0
+oslo.serialization==2.25.0
+oslo.utils==3.36.0
+PasteDeploy==2.0.0
+pbr==3.1.1
+prettytable==0.7.2
+pycparser==2.18
+pyeclib==1.3.1
+pykmip==0.7.0
+Pygments==2.2.0
+pyparsing==2.2.0
+pyperclip==1.6.0
+pytest==4.6.11
+pytest-cov==2.12.1
+pytest-subtests==0.3.0
+python-keystoneclient==3.19.0
+python-mimeparse==1.6.0
+python-subunit==1.2.0
+python-swiftclient==3.2.0
+pytz==2018.3
+PyYAML==3.12
+requests==2.14.2
+requests-mock==1.2.0
+rfc3986==1.1.0
+smmap2==2.0.3
+snowballstemmer==1.2.1
+stestr==2.0.0
+stevedore==1.28.0
+testtools==2.3.0
+traceback2==1.4.0
+unittest2==1.1.0
+urllib3==1.22
+voluptuous==0.11.1
+wrapt==1.10.11
+xattr==0.7.2
+pycadf===2.10.0
+python-dateutil===2.4.2
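
For reference, a lower-constraints file like the one above is applied with pip's -c flag. A minimal sketch, assuming a Swift checkout whose requirements.txt and test-requirements.txt sit next to this file:

    # Install dependencies pinned to the minimum versions the gate tests against.
    python3 -m venv .venv && . .venv/bin/activate
    pip install -r requirements.txt -r test-requirements.txt -c lower-constraints.txt
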
diff --git a/py3-constraints.txt b/py3-constraints.txt
new file mode 100644
index 0000000000..e947dda139
--- /dev/null
+++ b/py3-constraints.txt
@@ -0,0 +1,205 @@
+GitPython===3.1.45;python_version>='3.7'
+PasteDeploy===3.1.0;python_version>='3.7'
+PyJWT===2.10.1;python_version>='3.9'
+PyJWT===2.9.0;python_version=='3.8'
+# PyJWT only required for keystonemiddleware>10, which requires python>=3.8
+PyYAML===6.0.2;python_version>='3.8'
+PyYAML===6.0.1;python_version=='3.7'
+Pygments===2.19.2;python_version>='3.8'
+Pygments===2.17.2;python_version=='3.7'
+WebOb===1.8.9
+attrs===25.3.0;python_version>='3.8'
+attrs===24.2.0;python_version=='3.7'
+autopage===0.5.2
+bandit===1.8.6;python_version>='3.9'
+bandit===1.7.10;python_version=='3.8'
+bandit===1.7.5;python_version=='3.7'
+boto3===1.40.19;python_version>='3.9'
+boto3===1.37.38;python_version=='3.8'
+boto3===1.33.13;python_version=='3.7'
+botocore===1.40.19;python_version>='3.9'
+botocore===1.37.38;python_version=='3.8'
+botocore===1.33.13;python_version=='3.7'
+certifi===2025.8.3
+cffi===1.17.1;python_version>='3.8'
+cffi===1.15.1;python_version=='3.7'
+charset-normalizer===3.4.3;python_version>='3.7'
+cliff===4.11.0;python_version>='3.10'
+cliff===4.9.1;python_version=='3.9'
+cliff===4.7.0;python_version=='3.8'
+cliff===3.10.1;python_version=='3.7'
+cmd2===2.7.0;python_version>='3.9'
+cmd2===2.5.11;python_version=='3.8'
+cmd2===2.4.3;python_version=='3.7'
+coverage===7.10.5;python_version>='3.9'
+coverage===7.6.1;python_version=='3.8'
+coverage===7.2.7;python_version=='3.7'
+cryptography===45.0.6;python_version>='3.7'
+debtcollector===3.0.0;python_version>='3.8'
+debtcollector===2.5.0;python_version=='3.7'
+decorator===5.2.1;python_version>='3.8'
+decorator===5.1.1;python_version=='3.7'
+dnspython===2.7.0;python_version>='3.9'
+dnspython===2.6.1;python_version=='3.8'
+dnspython===2.3.0;python_version=='3.7'
+docutils===0.22;python_version>='3.9'
+docutils===0.20.1;python_version=='3.8'
+docutils===0.20.1;python_version=='3.7'
+dogpile.cache===1.4.0;python_version>='3.9'
+dogpile.cache===1.3.4;python_version=='3.8'
+dogpile.cache===1.2.2;python_version=='3.7'
+eventlet===0.40.3;python_version>='3.9'
+eventlet===0.39.1;python_version=='3.8'
+eventlet===0.38.2;python_version=='3.7'
+exceptiongroup===1.3.0;python_version>='3.7'
+extras===1.0.0
+fixtures===4.2.6;python_version>='3.9'
+fixtures===4.2.5;python_version=='3.8'
+fixtures===4.1.0;python_version=='3.7'
+flake8===7.1.2;python_version>='3.8'
+flake8===3.8.4;python_version=='3.7'
+gitdb===4.0.12;python_version>='3.7'
+greenlet===3.2.4;python_version>='3.9'
+greenlet===3.1.1;python_version=='3.8'
+greenlet===3.1.1;python_version=='3.7'
+hacking===7.0.0;python_version>='3.8'
+hacking===4.1.0;python_version=='3.7'
+idna===3.10
+importlib-metadata===8.7.0;python_version>='3.9'
+importlib-metadata===8.5.0;python_version=='3.8'
+importlib-metadata===6.7.0;python_version=='3.7'
+importlib-resources===6.5.2;python_version>='3.9'
+importlib-resources===6.4.5;python_version=='3.8'
+importlib-resources===5.12.0;python_version=='3.7'
+iniconfig===2.1.0;python_version>='3.8'
+iniconfig===2.0.0;python_version=='3.7'
+iso8601===2.1.0;python_version>='3.7'
+jmespath===1.0.1;python_version>='3.7'
+keystoneauth1===5.12.0;python_version>='3.10'
+keystoneauth1===5.11.1;python_version=='3.9'
+keystoneauth1===5.8.1;python_version=='3.8'
+keystoneauth1===5.1.3;python_version=='3.7'
+keystonemiddleware===10.12.0;python_version>='3.10'
+keystonemiddleware===10.11.0;python_version=='3.9'
+keystonemiddleware===10.7.1;python_version=='3.8'
+keystonemiddleware===9.5.0;python_version=='3.7'
+lxml===6.0.1;python_version>='3.8'
+lxml===5.4.0;python_version=='3.7'
+markdown-it-py===4.0.0;python_version>='3.10'
+markdown-it-py===3.0.0;python_version=='3.9'
+markdown-it-py===3.0.0;python_version=='3.8'
+markdown-it-py===2.2.0;python_version=='3.7'
+mccabe===0.7.0;python_version>='3.8'
+mccabe===0.6.1;python_version=='3.7'
+mdurl===0.1.2;python_version>='3.7'
+mock===5.2.0
+msgpack===1.1.1;python_version>='3.8'
+msgpack===1.0.5;python_version=='3.7'
+netaddr===1.3.0;python_version>='3.7'
+netifaces===0.11.0
+os-service-types===1.8.0;python_version>='3.10'
+os-service-types===1.7.0;python_version=='3.9'
+os-service-types===1.7.0;python_version=='3.8'
+os-service-types===1.7.0;python_version=='3.7'
+oslo.cache===3.12.0;python_version>='3.9'
+oslo.cache===3.8.0;python_version=='3.8'
+oslo.cache===2.11.0;python_version=='3.7'
+oslo.config===10.0.0;python_version>='3.9'
+oslo.config===9.6.0;python_version=='3.8'
+oslo.config===8.8.1;python_version=='3.7'
+oslo.context===6.1.0;python_version>='3.9'
+oslo.context===5.6.0;python_version=='3.8'
+oslo.context===4.1.0;python_version=='3.7'
+oslo.i18n===6.6.0;python_version>='3.9'
+oslo.i18n===6.4.0;python_version=='3.8'
+oslo.i18n===5.1.0;python_version=='3.7'
+oslo.log===7.2.1;python_version>='3.9'
+oslo.log===6.1.2;python_version=='3.8'
+oslo.log===4.8.0;python_version=='3.7'
+oslo.serialization===5.8.0;python_version>='3.9'
+oslo.serialization===5.5.0;python_version=='3.8'
+oslo.serialization===4.3.0;python_version=='3.7'
+oslo.utils===9.1.0;python_version>='3.9'
+oslo.utils===7.3.0;python_version=='3.8'
+oslo.utils===4.13.0;python_version=='3.7'
+packaging===25.0;python_version>='3.8'
+packaging===24.0;python_version=='3.7'
+pbr===7.0.1
+pluggy===1.6.0;python_version>='3.9'
+pluggy===1.5.0;python_version=='3.8'
+pluggy===1.2.0;python_version=='3.7'
+prettytable===3.16.0;python_version>='3.9'
+prettytable===3.11.0;python_version=='3.8'
+prettytable===3.7.0;python_version=='3.7'
+py===1.11.0
+pycadf===4.0.1;python_version>='3.9'
+pycadf===4.0.0;python_version=='3.8'
+pycadf===3.1.1;python_version=='3.7'
+pycodestyle===2.12.1;python_version>='3.8'
+pycodestyle===2.6.0;python_version=='3.7'
+pycparser===2.22;python_version>='3.8'
+pycparser===2.21;python_version=='3.7'
+pyeclib===1.6.4
+pyflakes===3.2.0;python_version>='3.8'
+pyflakes===2.2.0;python_version=='3.7'
+pyinotify===0.9.6
+pyparsing===3.2.3;python_version>='3.9'
+pyparsing===3.1.4;python_version=='3.8'
+pyparsing===3.1.4;python_version=='3.7'
+pyperclip===1.9.0
+pytest===8.4.1;python_version>='3.9'
+pytest===8.3.5;python_version=='3.8'
+pytest===7.4.4;python_version=='3.7'
+pytest-cov===6.2.1;python_version>='3.9'
+pytest-cov===5.0.0;python_version=='3.8'
+pytest-cov===4.1.0;python_version=='3.7'
+python-dateutil===2.9.0.post0
+python-keystoneclient===5.7.0;python_version>='3.10'
+python-keystoneclient===5.6.0;python_version=='3.9'
+python-keystoneclient===5.5.0;python_version=='3.8'
+python-keystoneclient===4.5.0;python_version=='3.7'
+python-subunit===1.4.4;python_version>='3.7'
+python-swiftclient===4.8.0
+pytz===2025.2
+requests===2.32.5;python_version>='3.9'
+requests===2.32.4;python_version=='3.8'
+requests===2.31.0;python_version=='3.7'
+requests-mock===1.12.1
+rfc3986===2.0.0;python_version>='3.7'
+rich===14.1.0;python_version>='3.8'
+rich===13.8.1;python_version=='3.7'
+s3transfer===0.13.1;python_version>='3.9'
+s3transfer===0.11.5;python_version=='3.8'
+s3transfer===0.8.2;python_version=='3.7'
+setuptools===75.3.0;python_version>='3.12'
+smmap===5.0.2;python_version>='3.7'
+stestr===4.2.0;python_version>='3.8'
+stestr===4.1.0;python_version=='3.7'
+stevedore===5.5.0;python_version>='3.9'
+stevedore===5.3.0;python_version=='3.8'
+stevedore===3.5.2;python_version=='3.7'
+testtools===2.7.2;python_version>='3.8'
+testtools===2.7.1;python_version=='3.7'
+tomli===2.2.1;python_version>='3.8'
+tomli===2.0.1;python_version=='3.7'
+tomlkit===0.13.3;python_version>='3.8'
+tomlkit===0.12.5;python_version=='3.7'
+typing_extensions===4.15.0;python_version>='3.9'
+typing_extensions===4.13.2;python_version=='3.8'
+typing_extensions===4.7.1;python_version=='3.7'
+tzdata===2025.2;python_version>='3.9'
+urllib3===2.5.0;python_version>='3.10'
+urllib3===1.26.20;python_version=='3.9'
+urllib3===1.26.20;python_version=='3.8'
+urllib3===1.26.20;python_version=='3.7'
+voluptuous===0.15.2;python_version>='3.9'
+voluptuous===0.14.2;python_version=='3.8'
+voluptuous===0.14.1;python_version=='3.7'
+wcwidth===0.2.13
+wrapt===1.17.3;python_version>='3.8'
+wrapt===1.16.0;python_version=='3.7'
+xattr===1.2.0;python_version>='3.8'
+xattr===0.10.1;python_version=='3.7'
+zipp===3.23.0;python_version>='3.9'
+zipp===3.20.2;python_version=='3.8'
+zipp===3.15.0;python_version=='3.7'
diff --git a/pyproject.toml b/pyproject.toml
new file mode 100644
index 0000000000..e63322f962
--- /dev/null
+++ b/pyproject.toml
@@ -0,0 +1,3 @@
+[build-system]
+requires = ["pbr>=6.0.0", "setuptools>=64"]
+build-backend = "pbr.build"
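
The pyproject.toml above only declares the PEP 517 build backend (pbr.build). A sketch of building the package with it, assuming the generic `build` frontend is installed:

    # The frontend creates an isolated build env, fetches pbr>=6.0.0 and
    # setuptools>=64 as declared above, and asks pbr.build for an sdist and wheel.
    pip install build
    python -m build
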
diff --git a/releasenotes/notes/2_10_0_release-666a76f4975657a5.yaml b/releasenotes/notes/2_10_0_release-666a76f4975657a5.yaml
new file mode 100644
index 0000000000..4b2e889112
--- /dev/null
+++ b/releasenotes/notes/2_10_0_release-666a76f4975657a5.yaml
@@ -0,0 +1,59 @@
+---
+features:
+ - >
+   Object versioning now supports a "history" mode in addition to
+   the older "stack" mode. The difference is in how DELETE requests
+   are handled. For full details, please read
+   https://docs.openstack.org/swift/latest/overview_object_versioning.html.
+ - >
+   New config variables to change the schedule priority and I/O
+   scheduling class. Servers and daemons now understand
+   `nice_priority`, `ionice_class`, and `ionice_priority` to
+   schedule their relative importance. Please read
+   https://docs.openstack.org/swift/latest/deployment_guide.html
+   for full config details.
+ - >
+   On newer kernels (3.15+ when using xfs), Swift will use the O_TMPFILE
+   flag when opening a file instead of creating a temporary file
+   and renaming it on commit. This makes the data path simpler and
+   allows the filesystem to more efficiently optimize the files on
+   disk, resulting in better performance.
+ - >
+   Erasure code GET performance has been significantly
+   improved in clusters that are not completely healthy.
+ - >
+   Significant improvements to the api-ref doc available at
+   https://developer.openstack.org/api-ref/object-storage/.
+ - >
+   A PUT or POST to a container will now update the container's
+   Last-Modified time, and that value will be included in a
+   GET/HEAD response.
+ - >
+   Include object sysmeta in POST responses. Sysmeta is still
+   stripped from the response before being sent to the client, but
+   this allows middleware to make use of the information.
+upgrade:
+ - >
+   Update dnspython dependency to 1.14, removing the need to have
+   separate dnspython dependencies for Py2 and Py3.
+ - >
+   Deprecate swift-temp-url and call python-swiftclient's
+   implementation instead. This adds python-swiftclient as an
+   optional dependency of Swift.
+ - >
+   Moved other-requirements.txt to bindep.txt. bindep.txt lists
+   non-python dependencies of Swift.
+fixes:
+ - >
+   Fixed a bug where a container listing delimiter wouldn't work
+   with encryption.
+ - >
+   Fixed a bug where some headers weren't being copied correctly
+   in a COPY request.
+ - >
+   Container sync can now copy SLOs more efficiently by allowing
+   the manifest to be synced before all of the referenced segments.
+   This fixes a bug where container sync would not copy SLO manifests.
+ - Fixed a bug where some tombstone files might never be reclaimed.
+other:
+  - Various other minor bug fixes and improvements.
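
The nice_priority / ionice_class / ionice_priority options mentioned in the notes above are plain per-server config settings. A minimal sketch for one server, with purely illustrative values (consult the deployment guide for the accepted classes and ranges):

    [object-server]
    # Illustrative only: slightly lower CPU priority, best-effort I/O class,
    # lowest best-effort I/O priority.
    nice_priority = 10
    ionice_class = IOPRIO_CLASS_BE
    ionice_priority = 7
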
diff --git a/releasenotes/notes/2_11_0_release-ac1d256e455d347e.yaml b/releasenotes/notes/2_11_0_release-ac1d256e455d347e.yaml
new file mode 100644
index 0000000000..f07982bbc0
--- /dev/null
+++ b/releasenotes/notes/2_11_0_release-ac1d256e455d347e.yaml
@@ -0,0 +1,54 @@
+---
+features:
+  - >
+    The improvements to EC reads made in Swift 2.10.0 have also been
+    applied to the reconstructor. This allows fragments to be rebuilt
+    in more circumstances, resulting in faster recovery from failures.
+  - >
+    Instead of using a separate .durable file to indicate the
+    durable status of an EC fragment archive, we rename the .data
+    to include a durable marker in the filename. This saves one
+    inode for every EC .data file. Existing .durable files will not
+    be removed, and they will continue to work just fine.
+  - >
+    Closed a bug where ssync may have written bad fragment data in
+    some circumstances. A check was added to ensure the correct number
+    of bytes is written for a fragment before finalizing the write.
+    Also, erasure coded fragment metadata will now be validated on read
+    requests and, if bad data is found, the fragment will be quarantined.
+  - Added a configurable URL base to staticweb.
+  - Support multi-range GETs for static large objects.
+  - >
+    TempURLs using the "inline" parameter can now also set the
+    "filename" parameter. Both are used in the Content-Disposition
+    response header.
+  - Mirror X-Trans-Id to X-Openstack-Request-Id.
+  - >
+    SLO will now concurrently HEAD segments, resulting in much faster
+    manifest validation and object creation. By default, two HEAD requests
+    will be done at a time, but this can be changed by the operator via
+    the new `concurrency` setting in the "[filter:slo]" section of
+    the proxy server config.
+  - Suppressed the KeyError message when auditor finds an expired object.
+  - Daemons using InternalClient can now be properly killed with SIGTERM.
+  - >
+    Added a "user" option to the drive-audit config file. Its value is
+    used to set the owner of the drive-audit recon cache.
+  - >
+    Throttle update_auditor_status calls so it updates no more than once
+    per minute.
+  - Suppress unexpected-file warnings for rsync temp files.
+upgrade:
+  - Updated the PyECLib dependency to 1.3.1.
+  - >
+    Note that after writing EC data with Swift 2.11.0 or later, that
+    data will not be accessible to earlier versions of Swift.
+critical:
+  - >
+    WARNING: If you are using the ISA-L library for erasure codes,
+    please upgrade to liberasurecode 1.3.1 (or later) as soon as
+    possible. If you are using isa_l_rs_vand with more than 4 parity,
+    please read https://bugs.launchpad.net/swift/+bug/1639691 and take
+    necessary action.
+other:
+  - Various other minor bug fixes and improvements.
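
The SLO `concurrency` setting described above lives in the proxy pipeline's SLO filter section. A sketch with an illustrative value:

    [filter:slo]
    use = egg:swift#slo
    # Illustrative: HEAD four segments at a time instead of the default two.
    concurrency = 4
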
diff --git a/releasenotes/notes/2_12_0_release-06af226abc7b91ef.yaml b/releasenotes/notes/2_12_0_release-06af226abc7b91ef.yaml
new file mode 100644
index 0000000000..0246fe5f3a
--- /dev/null
+++ b/releasenotes/notes/2_12_0_release-06af226abc7b91ef.yaml
@@ -0,0 +1,57 @@
+---
+features:
+  - >
+    Ring files now include byteorder information about the endian of
+    the machine used to generate the file, and the values are
+    appropriately byteswapped if deserialized on a machine with a
+    different endianness.
+
+    Newly created ring files will be byteorder agnostic, but
+    previously generated ring files will still fail on different
+    endian architectures. Regenerating older ring files will cause
+    them to become byteorder agnostic. The regeneration of the ring
+    files will not cause any new data movement. Newer ring files
+    will still be usable by older versions of Swift (on machines
+    with the same endianness--this maintains existing behavior).
+  - >
+    All 416 responses will now include a Content-Range header with
+    an unsatisfied-range value. This allows the caller to know the
+    valid range request value for an object.
+  - >
+    TempURLs now support a validation against a common prefix. A
+    prefix-based signature grants access to all objects which share the
+    same prefix. This avoids the creation of a large amount of signatures,
+    when a whole container or pseudofolder is shared.
+  - >
+    In SLO manifests, the `etag` and `size_bytes` keys are now fully
+    optional and not required. Previously, the keys needed to exist
+    but the values were optional. The only required key is `path`.
+  - Respect server type for --md5 check in swift-recon.
+fixes:
+  - Correctly handle deleted files with if-none-match requests.
+  - >
+    Correctly send 412 Precondition Failed if a user sends an
+    invalid copy destination. Previously Swift would send a 500
+    Internal Server Error.
+  - Fixed a rare infinite loop in `swift-ring-builder` while placing parts.
+  - >
+    Ensure update of the container by object-updater, removing a rare
+    possibility that objects would never be added to a container listing.
+  - >
+    Fixed non-deterministic suffix updates in hashes.pkl where a partition
+    may be updated much less often than expected.
+  - >
+    Fixed regression in consolidate_hashes that occurred when a new
+    file was stored to a new suffix in a non-empty partition. This bug
+    was introduced in 2.7.0 and could cause an increase in rsync
+    replication stats during and after upgrade, due to inconsistent
+    hashing of partition suffixes.
+  - >
+    Account and container databases will now be quarantined if the
+    database schema has been corrupted.
+  - Remove empty db hash and suffix directories if a db gets quarantined.
+other:
+  - >
+    Removed "in-process-" from func env tox name to work with
+    upstream CI.
+  - Various other minor bug fixes and improvements.
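
To illustrate the relaxed SLO manifest schema noted above (only `path` is required per segment), a hedged sketch of a manifest PUT; the host, account, container and segment names are placeholders:

    curl -i -X PUT \
      -H "X-Auth-Token: $TOKEN" \
      -d '[{"path": "/segments/report.part1"}, {"path": "/segments/report.part2"}]' \
      "https://swift.example.com/v1/AUTH_test/docs/report?multipart-manifest=put"
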
diff --git a/releasenotes/notes/2_13_0_release-875e1fb1ef59f015.yaml b/releasenotes/notes/2_13_0_release-875e1fb1ef59f015.yaml
new file mode 100644
index 0000000000..cd922910d7
--- /dev/null
+++ b/releasenotes/notes/2_13_0_release-875e1fb1ef59f015.yaml
@@ -0,0 +1,83 @@
+---
+features:
+  - >
+    Improved performance by eliminating an unneeded directory
+    structure hash.
+  - >
+    Optimized the common case for hashing filesystem trees, thus
+    eliminating a lot of extraneous disk I/O.
+  - >
+    Updated the `hashes.pkl` file format to include timestamp information
+    for race detection. Also simplified hashing logic to prevent race
+    conditions and optimize for the common case.
+  - >
+    The erasure code reconstructor will now shuffle work jobs across all
+    disks instead of going disk-by-disk. This eliminates single-disk I/O
+    contention and allows continued scaling as concurrency is increased.
+  - >
+    Erasure code reconstruction handles moving data from handoff nodes
+    better. Instead of moving the data to another handoff, it waits
+    until it can be moved to a primary node.
+  - >
+    Temporary URLs now support one common form of ISO 8601 timestamps in
+    addition to Unix seconds-since-epoch timestamps. The ISO 8601 format
+    accepted is '%Y-%m-%dT%H:%M:%SZ'. This makes TempURLs more
+    user-friendly to produce and consume.
+  - >
+    Listing containers in accounts with json or xml now includes a
+    `last_modified` time. This does not change any on-disk data, but simply
+    exposes the value to offer consistency with the object listings on
+    containers.
+  - I/O priority is now supported on AArch64 architecture.
+upgrade:
+  - If you upgrade and roll back, you must delete all `hashes.pkl` files.
+deprecations:
+  - >
+    If using erasure coding with ISA-L in rs_vand mode and 5 or more parity
+    fragments, Swift will emit a warning. This is a configuration that is
+    known to harm data durability. In a future release, this warning will be
+    upgraded to an error unless the policy is marked as deprecated. All data
+    in an erasure code storage policy using isa_l_rs_vand with 5 or more
+    parity should be migrated as soon as possible. Please see
+    https://bugs.launchpad.net/swift/+bug/1639691 for more information.
+  - >
+    The erasure code reconstructor `handoffs_first` option has been
+    deprecated in favor of `handoffs_only`. `handoffs_only` is far more
+    useful, and just like `handoffs_first` mode in the replicator, it gives
+    the operator the option of forcing the consistency engine to focus
+    solely on revert (handoff) jobs, thus improving the speed of
+    rebalances.  The `handoffs_only` behavior is somewhat consistent with
+    the replicator's `handoffs_first` option (any error on any handoff in
+    the replicator will make it essentially handoff only forever) but the
+    `handoffs_only` option does what you want and is named correctly in the
+    reconstructor.
+  - >
+    The default for `object_post_as_copy` has been changed to False. The
+    option is now deprecated and will be removed in a future release. If
+    your cluster is still running with post-as-copy enabled, please update
+    it to use the "fast-post" method. Future versions of Swift will not
+    support post-as-copy, and future features will not be supported under
+    post-as-copy. ("Fast-post" is where `object_post_as_copy` is false).
+fixes:
+  - >
+    Fixed a bug where the ring builder would not allow removal of a device
+    when min_part_seconds_left was greater than zero.
+  - >
+    PUT subrequests generated from a client-side COPY will now properly log
+    the SSC (server-side copy) Swift source field. See
+    https://docs.openstack.org/developer/swift/logs.html#swift-source for
+    more information.
+  - >
+    Fixed a bug where an SLO download with a range request may have resulted
+    in a 5xx series response.
+  - >
+    SLO manifest PUT requests can now be properly validated by sending an
+    ETag header of the md5 sum of the concatenated md5 sums of the
+    referenced segments.
+  - Fixed the stats calculation in the erasure code reconstructor.
+  - >
+    Rings with min_part_hours set to zero will now only move one partition
+    replica per rebalance, thus matching behavior when min_part_hours is
+    greater than zero.
+other:
+  - Various other minor bug fixes and improvements.
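
A sketch of a TempURL request using the ISO 8601 expiry form described above; the host, path and signature are placeholders, and the query parameters are the standard temp_url_sig / temp_url_expires:

    # The expiry uses the newly accepted '%Y-%m-%dT%H:%M:%SZ' form instead of
    # Unix seconds-since-epoch; $SIG stands in for the computed signature.
    curl -i "https://swift.example.com/v1/AUTH_test/container/obj?temp_url_sig=$SIG&temp_url_expires=2017-06-01T12:00:00Z"
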
diff --git a/releasenotes/notes/2_14_0_release-7c3ef515ebded888.yaml b/releasenotes/notes/2_14_0_release-7c3ef515ebded888.yaml
new file mode 100644
index 0000000000..0307a4985a
--- /dev/null
+++ b/releasenotes/notes/2_14_0_release-7c3ef515ebded888.yaml
@@ -0,0 +1,41 @@
+---
+features:
+  - EC Fragment Duplication - Foundational Global EC Cluster Support.
+  - name_check and cname_lookup keys have been added to `/info`.
+  - Add Vary headers for CORS responses.
+  - Always set Swift processes to use UTC.
+  - >
+    Removed per-device reconstruction stats. Now that the reconstructor
+    is shuffling parts before going through them, those stats no longer
+    make sense.
+  - domain_remap now accepts a list of domains in "storage_domain".
+  - Do not follow CNAME when host is in storage_domain.
+  - >
+    Enable cluster-wide CORS Expose-Headers setting via
+    "cors_expose_headers".
+  - Cache all answers from nameservers in cname_lookup.
+fixes:
+  - >
+    Fixed an error where a container drive failure resulted in double space
+    usage on the remaining drives. When a drive with a container or account
+    database is unmounted, the bug would create handoff replicas on all
+    remaining drives, increasing the drive space used and filling the cluster.
+  - >
+    Fixed UnicodeDecodeError in the object reconstructor that would
+    prevent objects with non-ascii names from being reconstructed and
+    caused the reconstructor process to hang.
+  - >
+    Fixed encoding issue in ssync where a mix of ascii and non-ascii
+    metadata values would cause an error.
+  - Log the correct request type of a subrequest downstream of copy.
+  - >
+    Prevent logged traceback in object-server on client disconnect for
+    chunked transfers to replicated policies.
+  - >
+    Fixed a race condition in updating hashes.pkl where a partition
+    suffix invalidation may have been skipped.
+  - Include received fragment index in reconstructor log warnings.
+  - Log correct status code for conditional requests.
+other:
+  - Drop support for auth-server from common/manager.py and `swift-init`.
+  - Various other minor bug fixes and improvements.
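
The storage_domain list support called out above is configured on the domain_remap filter. A minimal sketch with placeholder domains:

    [filter:domain_remap]
    use = egg:swift#domain_remap
    # Illustrative: multiple storage domains, comma-separated.
    storage_domain = example.com, storage.example.org
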
diff --git a/releasenotes/notes/2_15_0_release-0a05a011fb85a9c9.yaml b/releasenotes/notes/2_15_0_release-0a05a011fb85a9c9.yaml
new file mode 100644
index 0000000000..e0b239ddbc
--- /dev/null
+++ b/releasenotes/notes/2_15_0_release-0a05a011fb85a9c9.yaml
@@ -0,0 +1,102 @@
+---
+features:
+  - |
+    Add Composite Ring Functionality
+
+    A composite ring comprises two or more component rings that are
+    combined to form a single ring with a replica count equal to the
+    sum of the component rings. The component rings are built
+    independently, using distinct devices in distinct regions, which
+    means that the dispersion of replicas between the components can
+    be guaranteed.
+
+    Composite rings can be used for explicit replica placement and
+    "replicated EC" for global erasure codes policies.
+
+    Composite rings support 'cooperative' rebalance which means that
+    during rebalance all component rings will be consulted before a
+    partition is moved in any component ring. This avoids the same
+    partition being simultaneously moved in multiple components.
+
+    We do not yet have CLI tools for creating composite rings, but
+    the functionality has been enabled in the ring modules to
+    support this advanced functionality. CLI tools will be delivered
+    in a subsequent release.
+
+    For further information see the
+    `docs `__
+  - |
+    The EC reconstructor process has been dramatically improved by
+    adding support for multiple concurrent workers. Multiple
+    processes are required to get high concurrency, and this change
+    results in much faster rebalance times on servers with many
+    drives.
+
+    Currently the default is still only one process, and no workers.
+    Set ``reconstructor_workers`` in the ``[object-reconstructor]``
+    section to some whole number <= the number of devices on a node
+    to get that many reconstructor workers.
+  - |
+    Add support to increase object ring partition power transparently
+    to end users and with no cluster downtime. Increasing the ring
+    part power allows for incremental adjustment to the upper bound
+    of the cluster size. Please review the
+    `full docs `__
+    for more information.
+  - |
+    Added support for per-policy proxy config options. This allows
+    per-policy affinity options to be set for use with duplicated EC
+    policies and composite rings. Certain options found in per-policy
+    conf sections will override their equivalents that may be set
+    in the [app:proxy-server] section. Currently the options handled that
+    way are ``sorting_method``, ``read_affinity``, ``write_affinity``,
+    ``write_affinity_node_count``, and ``write_affinity_handoff_delete_count``.
+  - Enabled versioned writes on Dynamic Large Objects (DLOs).
+  - |
+    Write-affinity aware object deletion
+
+    Previously, when deleting objects in a multi-region Swift
+    deployment with write affinity configured, users always got a 404
+    when deleting an object before it was replicated to the appropriate nodes.
+
+    Now Swift will use ``write_affinity_handoff_delete_count`` to
+    determine how many local handoff nodes it should query to
+    get more candidates for the final response. The default value
+    "auto" means Swift will calculate the number automatically based
+    on the number of replicas and current cluster topology.
+  - |
+    Require that known-bad EC schemes be deprecated
+
+    Erasure-coded storage policies using ``isa_l_rs_vand`` and ``nparity``
+    >= 5 must be configured as deprecated, preventing any new
+    containers from being created with such a policy. This
+    configuration is known to harm data durability. Any data in such
+    policies should be migrated to a new policy. See
+    `Launchpad bug 1639691 <https://bugs.launchpad.net/swift/+bug/1639691>`__
+    for more information.
+  - |
+    Optimize the Erasure Code reconstructor protocol to reduce IO
+    load on servers.
+  - Fixed a bug where SSYNC would fail to replicate unexpired objects.
+  - Fixed a bug in domain_remap when obj starts/ends with slash.
+  - Fixed a socket leak in copy middleware when a large object was copied.
+  - Fixed a few areas where the ``swiftdir`` option was not respected.
+  - swift-recon now respects storage policy aliases.
+  - |
+    cname_lookup middleware now accepts a ``nameservers`` config
+    variable that, if defined, will be used for DNS lookups instead of
+    the system default.
+  - |
+    Make mount_check option usable in containerized environments by
+    adding a check for an ".ismount" file at the root directory of
+    a device.
+  - Remove deprecated ``vm_test_mode`` option.
+  - |
+    The object and container server config option ``slowdown`` has been
+    deprecated in favor of the new ``objects_per_second`` and
+    ``containers_per_second`` options.
+  - |
+    The output of devices from ``swift-ring-builder`` has been reordered
+    by region, zone, ip, and device.
+  - Imported docs content from openstack-manuals project.
+  - Various other minor bug fixes and improvements.
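
The reconstructor_workers option described above goes in the object server config's reconstructor section. A sketch with an illustrative value:

    [object-reconstructor]
    # Illustrative: four worker processes; the notes above suggest a whole
    # number no larger than the number of devices on the node.
    reconstructor_workers = 4
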
diff --git a/releasenotes/notes/2_15_1_release-be25e67bfc5e886a.yaml b/releasenotes/notes/2_15_1_release-be25e67bfc5e886a.yaml
new file mode 100644
index 0000000000..5c8ae8787a
--- /dev/null
+++ b/releasenotes/notes/2_15_1_release-be25e67bfc5e886a.yaml
@@ -0,0 +1,19 @@
+---
+fixes:
+  - |
+    Fixed a bug introduced in 2.15.0 where the object reconstructor
+    would exit with a traceback if no EC policy was configured.
+  - |
+    Fixed deadlock when logging from a tpool thread.
+
+    The object server runs certain IO-intensive methods outside the
+    main pthread for performance. Previously, if one of those methods
+    tried to log, it could cause a crash that eventually led to an
+    object server with hundreds or thousands of greenthreads, all
+    deadlocked. The fix is to use a mutex that works across different
+    greenlets and different pthreads.
+  - |
+    The object reconstructor can now rebuild an EC fragment for an
+    expired object.
+other:
+  - Various other minor bug fixes and improvements.
diff --git a/releasenotes/notes/2_15_2_release-6996eccabba558b4.yaml b/releasenotes/notes/2_15_2_release-6996eccabba558b4.yaml
new file mode 100644
index 0000000000..74bb146012
--- /dev/null
+++ b/releasenotes/notes/2_15_2_release-6996eccabba558b4.yaml
@@ -0,0 +1,22 @@
+---
+fixes:
+  - >
+    Fixed a cache invalidation issue related to GET and PUT requests to
+    containers that would occasionally cause object PUTs to a container to
+    404 after the container had been successfully created.
+
+  - >
+    Removed a race condition where a POST to an SLO could modify the
+    X-Static-Large-Object metadata.
+
+  - Fixed rare socket leak on range requests to erasure-coded objects.
+
+  - Fixed SLO delete for accounts with non-ASCII names.
+
+  - >
+    Fixed an issue in COPY where concurrent requests may have copied the
+    wrong data.
+
+  - Fixed time skew when using X-Delete-After.
+
+  - Send ETag header in 206 Partial Content responses to SLO reads.
diff --git a/releasenotes/notes/2_16_0_release-d48cb9b2629df8ab.yaml b/releasenotes/notes/2_16_0_release-d48cb9b2629df8ab.yaml
new file mode 100644
index 0000000000..51b819b9c9
--- /dev/null
+++ b/releasenotes/notes/2_16_0_release-d48cb9b2629df8ab.yaml
@@ -0,0 +1,107 @@
+---
+features:
+  - Add checksum to object extended attributes.
+
+  - |
+    Let clients request heartbeats during SLO PUTs by including
+    the query parameter ``heartbeat=on``.
+
+    With heartbeating turned on, the proxy will start its response
+    immediately with 202 Accepted then send a single whitespace
+    character periodically until the request completes. At that
+    point, a final summary chunk will be sent which includes a
+    "Response Status" key indicating success or failure and (if
+    successful) an "Etag" key indicating the Etag of the resulting
+    SLO.
+
+  - |
+    Added support for retrieving the encryption root secret from an
+    external key management system. In practice, this is currently limited
+    to Barbican.
+
+  - |
+    Move listing formatting out to a new proxy middleware named
+    ``listing_formats``. ``listing_formats`` should be just right of the
+    first proxy-logging middleware, and left of most other
+    middlewares. If it is not already present, it will be
+    automatically inserted for you.
+
+    Note: if you have a custom middleware that makes account or
+    container listings, it will only receive listings in JSON format.
+
+  - |
+    Log deprecation warning for ``allow_versions`` in the container
+    server config. Configure the ``versioned_writes`` middleware in
+    the proxy server instead. This option will be ignored in a
+    future release.
+
+  - |
+    Replaced ``replication_one_per_device`` by custom count defined by
+    ``replication_concurrency_per_device``. The original config value
+    is deprecated, but continues to function for now. If both values
+    are defined, the old ``replication_one_per_device`` is ignored.
+
+  - |
+    Fixed a rare issue where multiple backend timeouts could result
+    in bad data being returned to the client.
+
+  - Cleaned up logged tracebacks when talking to memcached servers.
+
+  - |
+    Account and container replication stats logs now include
+    ``remote_merges``, the number of times a whole database was sent
+    to another node.
+
+  - |
+    Respond 400 Bad Request when Accept headers fail to parse
+    instead of returning 406 Not Acceptable.
+
+  - |
+    The ``domain_remap`` middleware now supports the
+    ``mangle_client_paths`` option. Its default "false" value changes
+    ``domain_remap`` parsing to stop stripping the ``path_root`` value
+    from URL paths. If users depend on this path mangling, operators
+    should set ``mangle_client_paths`` to "True" before upgrading.
+
+  - |
+    Remove ``swift-temp-url`` script. The functionality has been in
+    swiftclient for a long time and this script has been deprecated
+    since 2.10.0.
+
+  - |
+    Removed all ``post_as_copy`` related code and configs. The option
+    has been deprecated since 2.13.0.
+
+  - |
+    Fixed XML responses (eg on bulk extractions and SLO upload
+    failures) to be more correct. The enclosing "delete" tag was
+    removed where it doesn't make sense and replaced with "extract"
+    or "upload" depending on the context.
+
+  - |
+    Static Large Object (SLO) manifests may now (again) have zero-byte
+    last segments.
+
+  - |
+    Fixed an issue where background consistency daemon child
+    processes would deadlock waiting on the same file descriptor.
+
+  - |
+    Removed a race condition where a POST to an SLO could modify the
+    X-Static-Large-Object metadata.
+
+  - |
+    Accept a trade off of dispersion for balance in the ring builder
+    that will result in getting to balanced rings much more quickly
+    in some cases.
+
+  - |
+    Fixed using ``swift-ring-builder set_weight`` with more than one
+    device.
+
+  - |
+    When requesting objects, return 404 if a tombstone is found and
+    is newer than any data found. Previous behavior was to return
+    stale data.
+other:
+  - Various other minor bug fixes and improvements.
diff --git a/releasenotes/notes/2_17_0_release-bd35f18c41c5ef18.yaml b/releasenotes/notes/2_17_0_release-bd35f18c41c5ef18.yaml
new file mode 100644
index 0000000000..cdb9ff04c2
--- /dev/null
+++ b/releasenotes/notes/2_17_0_release-bd35f18c41c5ef18.yaml
@@ -0,0 +1,119 @@
+---
+features:
+  - |
+    Added symlink objects support.
+
+    Symlink objects reference one other object. They are created by
+    creating an empty object with an X-Symlink-Target header. The value of
+    the header is of the format <container>/<object>, and the target does
+    not need to exist at the time of symlink creation. Cross-account
+    symlinks can be created by including the
+    X-Symlink-Target-Account header.
+
+    GET and HEAD requests to a symlink will operate on the
+    referenced object and require appropriate permission in the
+    target container. DELETE and PUT requests will operate on the
+    symlink object itself. POST requests are not forwarded to the
+    referenced object. POST requests sent to a symlink will result
+    in a 307 Temporary Redirect response.
+
+  - |
+    Added support for inline data segments in SLO manifests.
+
+    Upgrade impact -- during a rolling upgrade, an updated proxy server
+    may write a manifest that an out-of-date proxy server will not be
+    able to read. This will resolve itself once the upgrade completes
+    on all nodes.
+
+  - |
+    The tempurl digest algorithm is now configurable, and Swift added
+    support for both SHA-256 and SHA-512. Supported tempurl digests
+    are exposed to clients in ``/info``. Additionally, tempurl signatures
+    can now be base64 encoded.
+
+  - |
+    Object expiry improvements
+
+    - Disallow X-Delete-At header values equal to the X-Timestamp header.
+
+    - X-Delete-At computation now uses X-Timestamp instead of
+      system time. This prevents clock skew causing inconsistent
+      expiry data.
+
+    - Deleting an expiring object will now cause less work in the system.
+      The number of async pending files written has been reduced for all
+      objects and greatly reduced for erasure-coded objects. This
+      dramatically reduces the burden on container servers.
+
+    - Stopped logging tracebacks when receiving an unexpected response.
+
+    - Allow the expirer to gracefully move past updating stale work items.
+
+  - |
+    When the object auditor examines an object, it will now add any
+    missing metadata checksums.
+
+  - |
+    ``swift-ring-builder`` improvements
+
+    - Save the ring when dispersion improves, even if balance
+      doesn't improve.
+
+    - Improved the granularity of the ring dispersion metric so that
+      small improvements after a rebalance can show changes in the
+      dispersion number. Dispersion in existing and new rings can be
+      recalculated using the new ``--recalculate`` option to
+      ``swift-ring-builder``.
+
+    - Display more info on empty rings.
+
+  - |
+    Fixed rare socket leak on range requests to erasure-coded objects.
+
+  - |
+    The number of container updates on object PUTs (ie to update listings)
+    has been recomputed to be far more efficient while maintaining
+    durability guarantees. Specifically, object PUTs to erasure-coded
+    policies will now normally result in far fewer container updates.
+
+  - |
+    Moved Zuul v3 tox jobs into the Swift code repo.
+
+  - |
+    Changed where liberasurecode-devel for CentOS 7 is referenced and
+    installed as a dependency.
+
+  - |
+    Added container/object listing with prefix to InternalClient.
+
+  - |
+    Added ``--swift-versions`` to ``swift-recon`` CLI to compare installed
+    versions in the cluster.
+
+  - |
+    Stop logging tracebacks in the ``object-replicator`` when it runs
+    out of handoff locations.
+
+  - |
+    Send ETag header in 206 Partial Content responses to SLO reads.
+
+  - |
+    Now ``swift-recon-cron`` works with conf.d configs.
+
+  - |
+    Improved ``object-updater`` stats logging. It now tells you all of
+    its stats (successes, failures, quarantines due to bad pickles,
+    unlinks, and errors), and it tells you incremental progress every
+    five minutes. The logging at the end of a pass remains and has
+    been expanded to also include all stats.
+
+  - |
+    If a proxy server is configured to autocreate accounts and the
+    account create fails, it will now return a server error (500)
+    instead of Not Found (404).
+
+  - |
+    Fractional replicas are no longer allowed for erasure code policies.
+
+  - |
+    Various other minor bug fixes and improvements.
diff --git a/releasenotes/notes/2_17_1_release-dd6e6879cbb94f85.yaml b/releasenotes/notes/2_17_1_release-dd6e6879cbb94f85.yaml
new file mode 100644
index 0000000000..b1fbf2cf37
--- /dev/null
+++ b/releasenotes/notes/2_17_1_release-dd6e6879cbb94f85.yaml
@@ -0,0 +1,11 @@
+---
+fixes:
+  - Fix SLO delete for accounts with non-ASCII names.
+
+  - >
+    Fixed an issue in COPY where concurrent requests may have copied the
+    wrong data.
+
+  - >
+    Fixed a bug in how Swift uses eventlet that was exposed under high
+    concurrency.
diff --git a/releasenotes/notes/2_18_0_release-3acf63cfe2475c65.yaml b/releasenotes/notes/2_18_0_release-3acf63cfe2475c65.yaml
new file mode 100644
index 0000000000..1b98c48100
--- /dev/null
+++ b/releasenotes/notes/2_18_0_release-3acf63cfe2475c65.yaml
@@ -0,0 +1,85 @@
+---
+features:
+  - |
+    Added container sharding, an operator controlled feature that
+    may be used to shard very large container databases into a
+    number of smaller shard containers. This mitigates the issues
+    with one large DB by distributing the data across multiple
+    smaller databases throughout the cluster. Please read the full
+    overview at
+    https://docs.openstack.org/swift/latest/overview_container_sharding.html
+
+  - |
+    Provide an S3 API compatibility layer. The external "swift3"
+    project has been imported into Swift's codebase as the "s3api"
+    middleware.
+
+  - |
+    Added "emergency mode" hooks in the account and container replicators.
+    These options may be used to prioritize moving handoff
+    partitions to primary locations more quickly. This helps when
+    adding capacity to a ring.
+
+    - Added ``-d <devs>`` and ``-p <partitions>`` command line options.
+
+    - Added a handoffs-only mode.
+
+  - |
+    Add a multiprocess mode to the object replicator. Setting the
+    ``replicator_workers`` setting to a positive value N will result
+    in the replicator using up to N worker processes to perform
+    replication tasks. At most one worker per disk will be spawned.
+
+    Worker process logs will have a bit of information prepended so
+    operators can tell which messages came from which worker. The
+    prefix is "[worker M/N pid=P] ", where M is the worker's index,
+    N is the total number of workers, and P is the process ID. Every
+    message from the replicator's logger will have the prefix.
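+
+    A minimal sketch (the worker count is only an example)::
+
+        [object-replicator]
+        replicator_workers = 4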
+
+  - |
+    The object reconstructor will now fork all available worker
+    processes when operating on a subset of local devices.
+
+  - |
+    Add support for PROXY protocol v1 to the proxy server. This
+    allows the Swift proxy server to log accurate client IP
+    addresses when there is a proxy or SSL-terminator between the
+    client and the Swift proxy server.  Example servers supporting
+    this PROXY protocol include stunnel, haproxy, hitch, and
+    varnish. See the sample proxy server config file for the
+    appropriate config setting to enable or disable this
+    functionality.
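+
+    A sketch, assuming the option name used in the sample proxy config::
+
+        [DEFAULT]
+        require_proxy_protocol = true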
+
+  - |
+    In the ratelimit middleware, account whitelist and blacklist
+    settings have been deprecated and may be removed in a future
+    release. When found, a deprecation message will be logged.
+    Instead of these config file values, set
+    X-Account-Sysmeta-Global-Write-Ratelimit:WHITELIST and
+    X-Account-Sysmeta-Global-Write-Ratelimit:BLACKLIST on the
+    particular accounts that need
+    to be whitelisted or blacklisted. System metadata cannot be added
+    or modified by standard clients. Use the internal client to set sysmeta.
+
+  - |
+    Add a ``--drop-prefixes`` flag to swift-account-info,
+    swift-container-info, and swift-object-info. This makes the
+    output between the three more consistent.
+
+  - |
+    statsd error messages correspond to 5xx responses only. This
+    makes monitoring more useful because actual errors (5xx) will
+    not be hidden by common user requests (4xx). Previously, some 4xx
+    responses would be included in timing information in the statsd
+    error messages.
+
+  - |
+    Truncate error logs to prevent log handler from running out of buffer.
+
+  - |
+    Updated requirements.txt to match global exclusions and formatting.
+
+  - |
+    tempauth user names now support unicode characters.
+
+  - |
+    Various other minor bug fixes and improvements.
diff --git a/releasenotes/notes/2_19_0_release-3e6ee3e6a1fcc6bb.yaml b/releasenotes/notes/2_19_0_release-3e6ee3e6a1fcc6bb.yaml
new file mode 100644
index 0000000000..d06e263952
--- /dev/null
+++ b/releasenotes/notes/2_19_0_release-3e6ee3e6a1fcc6bb.yaml
@@ -0,0 +1,103 @@
+---
+features:
+  - |
+    TempURLs now support IP range restrictions. Please see
+    https://docs.openstack.org/swift/latest/middleware.html#client-usage
+    for more information on how to use this additional restriction.
+
+  - |
+    Add support for multiple root encryption secrets for the trivial
+    and KMIP keymasters. This allows operators to rotate encryption
+    keys over time without needing to re-encrypt all existing data
+    in the cluster. Please see the included sample config files for
+    instructions on how to configure multiple encryption keys.
+
+  - |
+    The object updater now supports two configuration settings:
+    "concurrency" and "updater_workers". The latter controls how many
+    worker processes are spawned, while the former controls how many
+    concurrent container updates are performed by each worker
+    process. This should speed the processing of async_pendings.
+
+    On upgrade, a node configured with concurrency=N will still handle
+    async updates N-at-a-time, but will do so using only one process
+    instead of N.
+
+    If you have a config file like this::
+
+        [object-updater]
+        concurrency = <N>
+
+    and you want to take advantage of faster updates, then do this::
+
+        [object-updater]
+        concurrency = 8  # the default; you can omit this line
+        updater_workers = <N>
+
+    If you want updates to be processed exactly as before, do this::
+
+        [object-updater]
+        concurrency = 1
+        updater_workers = <N>
+
+  - |
+    When listing objects in a container in json format, static large
+    objects (SLOs) will now include an additional new "slo_etag" key
+    that matches the etag returned when requesting the SLO. The
+    existing "hash" key remains unchanged as the MD5 of the SLO
+    manifest. Text and XML listings are unaffected by this change.
+
+  - |
+    Log deprecation warnings for ``run_pause``. This setting was
+    deprecated in Swift 2.4.0 and is replaced by ``interval``.
+    It may be removed in a future release.
+
+  - |
+    Object reconstructor logs are now prefixed with information
+    about the specific worker process logging the message. This
+    makes reading the logs and understanding the messages much simpler.
+
+  - |
+    Lower bounds of dependencies have been updated to reflect what
+    is actually tested.
+
+  - |
+    SSYNC replication mode now removes as much of the directory
+    structure as possible as soon as it observes that the directory
+    is empty. This reduces the work needed for subsequent replication
+    passes.
+
+  - |
+    The container-updater now reports zero objects and bytes used for
+    child DBs in sharded containers. This prevents double-counting in
+    utilization reports.
+
+  - |
+    Add fallocate_reserve to account and container servers. This
+    allows disks shared between account/container and object rings to
+    avoid getting 100% full. The default value of 1% matches the
+    existing default on object servers.
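+
+    For example, to set the reserve explicitly to the stated default::
+
+        [DEFAULT]
+        fallocate_reserve = 1%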
+
+  - |
+    Added an experimental ``swift-ring-composer`` CLI tool to build
+    composite rings.
+
+  - |
+    Added an optional ``read_only`` middleware to make an entire cluster
+    or individual accounts read only.
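+
+    A minimal sketch of enabling it cluster-wide (option and section names
+    assumed to follow the sample proxy config)::
+
+        [filter:read_only]
+        use = egg:swift#read_only
+        read_only = true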
+
+  - |
+    Fixed a bug where zero-byte PUTs would not work properly
+    with "If-None-Match: \*" conditional requests.
+
+  - ACLs now work with unicode in user/account names.
+
+  - COPY now works with unicode account names.
+
+  - Improved S3 API compatibility.
+
+  - |
+    Lock timeouts in the container updater are now logged at INFO
+    level, not ERROR.
+
+  - Various other minor bug fixes and improvements.
diff --git a/releasenotes/notes/2_19_1_release-5072dd72557f5708.yaml b/releasenotes/notes/2_19_1_release-5072dd72557f5708.yaml
new file mode 100644
index 0000000000..0e1a6d259c
--- /dev/null
+++ b/releasenotes/notes/2_19_1_release-5072dd72557f5708.yaml
@@ -0,0 +1,16 @@
+---
+fixes:
+  - >
+    Prevent PyKMIP's kmip_protocol logger from logging at DEBUG.
+    Previously, some versions of PyKMIP would include all wire
+    data when the root logger was configured to log at DEBUG; this
+    could expose key material in logs. Only the kmip_keymaster was
+    affected.
+
+  - >
+    Fixed an issue where a failed drive could prevent the container sharder
+    from making progress.
+
+  - >
+    Fixed a bug in how Swift uses eventlet that was exposed under high
+    concurrency.
diff --git a/releasenotes/notes/2_20_0_release-7b090a5f4bd916e4.yaml b/releasenotes/notes/2_20_0_release-7b090a5f4bd916e4.yaml
new file mode 100644
index 0000000000..7d15183f30
--- /dev/null
+++ b/releasenotes/notes/2_20_0_release-7b090a5f4bd916e4.yaml
@@ -0,0 +1,116 @@
+---
+features:
+  - |
+    S3 API compatibility updates
+
+    - Swift can now cache the S3 secret from Keystone to use for
+      subsequent requests. This functionality is disabled by default but
+      can be enabled by setting the ``secret_cache_duration`` in the
+      ``[filter:s3token]`` section of the proxy server config to a number
+      greater than 0.
+
+    - s3api now mimics the AWS S3 behavior of periodically sending
+      whitespace characters on a Complete Multipart Upload request to keep
+      the connection from timing out. Note that since a request could fail
+      after the initial 200 OK response has been sent, it is important to
+      check the response body to determine if the request succeeded.
+
+    - s3api now properly handles ``x-amz-metadata-directive`` headers on
+      COPY operations.
+
+    - s3api now uses concurrency (default 2) to handle multi-delete
+      requests. This allows multi-delete requests to be processed much
+      more quickly.
+
+    - s3api now mimics some forms of AWS server-side encryption
+      based on whether Swift's at-rest encryption functionality is enabled.
+      Note that S3 API users are now able to know more about how the
+      cluster is configured than they were previously, ie knowledge of
+      encryption at-rest functionality being enabled or not.
+
+    - s3api responses now include a '-' in multipart ETags.
+
+      For new multipart-uploads via the S3 API, the ETag that is
+      stored will be calculated in the same way that AWS uses. This
+      ETag will be used in GET/HEAD responses, bucket listings, and
+      conditional requests via the S3 API. Accessing the same object
+      via the Swift API will use the SLO Etag; however, in JSON
+      container listings the multipart upload etag will be exposed
+      in a new "s3_etag" key. Previously, some S3 clients would complain
+      about download corruption when the ETag did not have a '-'.
+
+    - S3 ETags for SLOs now include a '-'.
+
+      Ordinary objects in S3 use the MD5 of the object as the ETag,
+      just like Swift. Multipart Uploads follow a different format, notably
+      including a dash followed by the number of segments. To that end
+      (and for S3 API requests *only*), SLO responses via the S3 API have a
+      literal '-N' added on the end of the ETag.
+
+    - The default location is now set to "us-east-1". This is more likely
+      to be the default region that a client will try when using v4
+      signatures.
+
+      Deployers with clusters that relied on the old implicit default
+      location of "US" should explicitly set ``location = US`` in the
+      ``[filter:s3api]`` section of proxy-server.conf before upgrading.
+
+    - Add basic support for ?versions bucket listings. We still do not
+      have support for toggling S3 bucket versioning, but we can at least
+      support getting the latest versions of all objects.
+
+  - |
+    Fixed an issue with SSYNC requests to ensure that only one request
+    can be running on a partition at a time.
+
+  - |
+    Data encryption updates
+
+    - The ``kmip_keymaster`` middleware can now be configured directly in the
+      proxy-server config file. The existing behavior of using an external
+      config file is still supported.
+
+    - Multiple keymaster middlewares are now supported. This allows
+      migration from one key provider to another.
+
+      Note that ``secret_id`` values must remain unique across all keymasters
+      in a given pipeline. If they are not unique, the right-most keymaster
+      will take precedence.
+
+      When looking for the active root secret, only the right-most
+      keymaster is used.
+
+    - Prevent PyKMIP's kmip_protocol logger from logging at DEBUG.
+      Previously, some versions of PyKMIP would include all wire
+      data when the root logger was configured to log at DEBUG; this
+      could expose key material in logs. Only the ``kmip_keymaster`` was
+      affected.
+
+  - |
+    Fixed an issue where a failed drive could prevent the container sharder
+    from making progress.
+
+  - |
+    Storage policy definitions in swift.conf can now define the diskfile
+    to use to access objects. See the included swift.conf-sample file for
+    a description of usage.
+
+  - |
+    The EC reconstructor will now attempt to remove empty directories
+    immediately, while the inodes are still cached, rather than waiting
+    until the next run.
+
+  - |
+    Added a ``keep_idle`` config option to configure KEEPIDLE time for TCP
+    sockets. The default value is the old constant of 600.
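+
+    For example, setting it explicitly to the stated default in a server's
+    ``[DEFAULT]`` section::
+
+        [DEFAULT]
+        keep_idle = 600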
+
+  - |
+    Add ``databases_per_second`` to the account-replicator,
+    container-replicator, and container-sharder. This prevents them from
+    using a full CPU core when they are not IO limited.
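+
+    A sketch for one of the daemons (the value is only an example)::
+
+        [container-replicator]
+        databases_per_second = 50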
+
+  - |
+    Allow direct_client users to overwrite the ``X-Timestamp`` header.
+
+  - |
+    Various other minor bug fixes and improvements.
diff --git a/releasenotes/notes/2_21_0_release-d8ae33ef18b7be3a.yaml b/releasenotes/notes/2_21_0_release-d8ae33ef18b7be3a.yaml
new file mode 100644
index 0000000000..1c9c06a1a9
--- /dev/null
+++ b/releasenotes/notes/2_21_0_release-d8ae33ef18b7be3a.yaml
@@ -0,0 +1,69 @@
+---
+features:
+  - |
+    Change the behavior of the EC reconstructor to perform a
+    fragment rebuild to a handoff node when a primary peer responds
+    with 507 to the REPLICATE request. This changes EC to match the
+    existing behavior of replication when drives fail. After a
+    rebalance of EC rings (potentially removing unmounted/failed
+    devices), it's most IO efficient to run in handoffs_only mode to
+    avoid unnecessary rebuilds.
+
+  - |
+    O_TMPFILE support is now detected by attempting to use it
+    instead of looking at the kernel version. This allows older
+    kernels with backported patches to take advantage of the
+    O_TMPFILE functionality.
+
+  - |
+    Add slo_manifest_hook callback to allow other middlewares to
+    impose additional constraints on or make edits to SLO manifests
+    before being written. For example, a middleware could enforce
+    minimum segment size or insert data segments.
+
+  - |
+    Fixed an issue with multi-region EC policies that caused the EC
+    reconstructor to constantly attempt cross-region rebuild
+    traffic.
+
+  - |
+    Fixed an issue where S3 API v4 signatures would not be validated
+    against the body of the request, allowing a replay attack if
+    request headers were captured by a malicious third party.
+
+  - Display crypto data/metadata details in swift-object-info.
+
+  - formpost can now accept a content-encoding parameter.
+
+  - |
+    Fixed an issue where multipart uploads with the S3 API would
+    sometimes report an error despite all segments being upload
+    successfully.
+
+  - |
+    Multipart object segments are now actually deleted when the
+    multipart object is deleted via the S3 API.
+
+  - |
+    Swift now returns a 503 (instead of a 500) when an account
+    auto-create fails.
+
+  - |
+    Fixed a bug where encryption would store the incorrect key
+    metadata if the object name starts with a slash.
+
+  - |
+    Fixed an issue where an object server failure during a client
+    download could leave an open socket between the proxy and
+    client.
+
+  - |
+    Fixed an issue where deleted EC objects didn't have their
+    on-disk directories cleaned up. This would cause extra resource
+    usage on the object servers.
+
+  - |
+    Fixed an issue where bulk requests using XML and expect
+    100-continue would return a malformed HTTP response.
+
+  - Various other minor bug fixes and improvements.
diff --git a/releasenotes/notes/2_22_0_release-f60d29508b3c1283.yaml b/releasenotes/notes/2_22_0_release-f60d29508b3c1283.yaml
new file mode 100644
index 0000000000..1e6ea3b1e4
--- /dev/null
+++ b/releasenotes/notes/2_22_0_release-f60d29508b3c1283.yaml
@@ -0,0 +1,87 @@
+---
+features:
+  - |
+    Experimental support for Python 3.6 and 3.7 is now available.
+    Note that this requires ``eventlet>=0.25.0``. All unit tests pass,
+    and running functional tests under Python 2 will pass against
+    services running under Python 3. Expect full support in the
+    next minor release.
+
+  - |
+    Log formats are now more configurable and include support for
+    anonymization. See the ``log_msg_template`` option in ``proxy-server.conf``
+    and the Swift documentation for more information.
+
+  - |
+    Added an operator tool, ``swift-container-deleter``, to asynchronously
+    delete some or all objects in a container using the object expirers.
+
+  - |
+    Swift-all-in-one Docker images are now built and published to
+    https://hub.docker.com/r/openstackswift/saio. These are intended
+    for use as development targets, but will hopefully be useful as a
+    starting point for other work involving containerizing Swift.
+
+upgrade:
+  - |
+    The ``object-expirer`` may now be configured in ``object-server.conf``.
+    This is in anticipation of a future change to allow the ``object-expirer``
+    to be deployed on all nodes that run the ``object-server``.
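+
+    A minimal sketch of such a configuration (the option shown is only an
+    example)::
+
+        [object-expirer]
+        interval = 300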
+
+  - |
+    **Dependency updates**: we've increased our minimum supported version
+    of ``cryptography`` to 2.0.2 and ``netifaces`` to 0.8. This is largely due
+    to the difficulty of continuing to test with the old versions.
+
+    If running Swift under Python 3, ``eventlet`` must be at least 0.25.0.
+
+fixes:
+  - |
+    Correctness improvements
+
+    * The ``proxy-server`` now ignores 404 responses from handoffs without
+      databases when deciding on the correct response for account and
+      container requests.
+
+    * Object writes to a container whose existence cannot be verified
+      now 503 instead of 404.
+
+  - |
+    Sharding improvements
+
+    * The ``container-replicator`` now only attempts to fetch shard ranges if
+      the remote indicates that it has shard ranges. Further, it does so
+      with a timeout to prevent the process from hanging in certain cases.
+
+    * The ``proxy-server`` now caches 'updating' shards, improving write
+      performance for sharded containers. A new config option,
+      ``recheck_updating_shard_ranges``, controls the cache time; set it to
+      0 to disable caching.
+
+    * The ``container-replicator`` now correctly enqueues
+      ``container-reconciler`` work for sharded containers.
+
+  - |
+    S3 API improvements
+
+    * Unsigned payloads work with v4 signatures once more.
+
+    * Multipart upload parts may now be copied from other multipart uploads.
+
+    * CompleteMultipartUpload requests with a ``Content-MD5`` now work.
+
+    * ``Content-Type`` can now be updated when copying an object.
+
+    * Fixed v1 listings that end with a non-ASCII object name.
+
+  - |
+    Background corruption-detection improvements
+
+    * Detect and remove invalid entries from ``hashes.pkl``
+
+    * When object path is not a directory, just quarantine it,
+      rather than the whole suffix.
+
+  - |
+    Various other minor bug fixes and improvements.
diff --git a/releasenotes/notes/2_23_0_release-2a2d11c1934f0b61.yaml b/releasenotes/notes/2_23_0_release-2a2d11c1934f0b61.yaml
new file mode 100644
index 0000000000..656950ee71
--- /dev/null
+++ b/releasenotes/notes/2_23_0_release-2a2d11c1934f0b61.yaml
@@ -0,0 +1,74 @@
+---
+features:
+  - |
+    Python 3.6 and 3.7 are now fully supported. If you've been testing Swift
+    on Python 3, upgrade at your earliest convenience.
+
+  - |
+    Added "static symlinks", which perform some validation as they
+    follow redirects and include more information about their target
+    in container listings. For more information, see the symlink
+    middleware section of the documentation.
+
+  - |
+    Multi-character strings may now be used as delimiters in account
+    and container listings.
+
+upgrade:
+  - |
+    **Dependency update**: ``eventlet`` must be at least 0.25.0. This also
+    dragged forward minimum-supported versions of ``dnspython`` (1.15.0),
+    ``greenlet`` (0.3.2), and ``six`` (1.10.0).
+
+fixes:
+  - |
+    Python 3 fixes:
+
+    * Removed a request-smuggling vector when running a mixed
+      py2/py3 cluster.
+
+    * Allow ``fallocate_reserve`` to be specified as a percentage.
+
+    * Fixed listings for sharded containers.
+
+    * Fixed non-ASCII account metadata handling.
+
+    * Fixed ``rsync`` output parsing.
+
+    * Fixed some title-casing of headers.
+
+    If you've been testing Swift on Python 3, upgrade at your earliest
+    convenience.
+
+  - |
+    Sharding improvements
+
+    * Container metadata related to sharding are now removed when no
+      longer needed.
+
+    * Empty container databases (such as might be created on handoffs)
+      now shard much more quickly.
+
+  - |
+    The ``proxy-server`` now ignores 404 responses from handoffs that have
+    no data when deciding on the correct response for object requests,
+    similar to what it already does for account and container requests.
+
+  - |
+    Static Large Object sizes in listings for versioned containers are
+    now more accurate.
+
+  - |
+    When refetching Static Large Object manifests, non-manifest responses
+    are now handled better.
+
+  - |
+    S3 API now translates ``503 Service Unavailable`` responses to a more
+    S3-like response instead of raising an error.
+
+  - |
+    Improved proxy-to-backend requests to be more RFC-compliant.
+
+  - |
+    Various other minor bug fixes and improvements.
diff --git a/releasenotes/notes/2_24_0_release-1ca244cc959922fc.yaml b/releasenotes/notes/2_24_0_release-1ca244cc959922fc.yaml
new file mode 100644
index 0000000000..0155cb2c03
--- /dev/null
+++ b/releasenotes/notes/2_24_0_release-1ca244cc959922fc.yaml
@@ -0,0 +1,92 @@
+---
+features:
+  - |
+    Added a new object versioning mode, with APIs for querying and
+    accessing old versions. For more information, see the documentation.
+
+  - |
+    Added support for S3 versioning using the above new mode.
+
+  - |
+    Added a new middleware to allow accounts and containers to opt-in to
+    RFC-compliant ETags. For more information, see the documentation.
+    Clients should be aware of the fact that ETags may be quoted for RFC
+    compliance; this may become the default behavior in some future release.
+
+  - |
+    Proxy, account, container, and object servers now support "seamless
+    reloads" via ``SIGUSR1``. This is similar to the existing graceful
+    restarts but keeps the server socket open the whole time, reducing
+    service downtime.
+
+  - |
+    New buckets created via the S3 API will now store multi-part upload
+    data in the same storage policy as other data rather than the
+    cluster's default storage policy.
+
+  - |
+    Device region and zone can now be changed via ``swift-ring-builder``.
+    Note that this may cause a lot of data movement on the next rebalance
+    as the builder tries to reach full dispersion.
+
+  - |
+    Added support for Python 3.8.
+
+
+deprecations:
+  - |
+    Per-service ``auto_create_account_prefix`` settings are now deprecated
+    and may be ignored in a future release; if you need to use this, please
+    set it in the ``[swift-constraints]`` section of ``/etc/swift/swift.conf``.
+
+fixes:
+  - |
+    The container sharder can now handle containers with special
+    characters in their names.
+
+  - |
+    Internal client no longer logs object DELETEs as status 499.
+
+  - |
+    Objects with an ``X-Delete-At`` value in the far future no longer cause
+    backend server errors.
+
+  - |
+    The bulk extract middleware once again allows clients to specify metadata
+    (including expiration timestamps) for all objects in the archive.
+
+  - |
+    Container sync now synchronizes static symlinks in a way similar to
+    static large objects.
+
+  - |
+    ``swift_source`` is set for more sub-requests in the proxy-server. See
+    the documentation.
+
+  - |
+    Errors encountered while validating static symlink targets no longer
+    cause ``BadResponseLength`` errors in the proxy-server.
+
+  - |
+    On Python 3, the KMS keymaster now works with secrets stored
+    in Barbican with a ``text/plain`` payload-content-type.
+
+  - |
+    On Python 3, the formpost middleware now works with unicode file names.
+
+  - |
+    On Python 3, certain S3 API headers are now lower case as they
+    would be coming from AWS.
+
+  - |
+    Several utility scripts now work better on Python 3:
+
+    * ``swift-account-audit``
+
+    * ``swift-dispersion-populate``
+
+    * ``swift-drive-recon``
+
+    * ``swift-recon``
diff --git a/releasenotes/notes/2_25_0_release-09410c808881bf21.yaml b/releasenotes/notes/2_25_0_release-09410c808881bf21.yaml
new file mode 100644
index 0000000000..4782f61d0c
--- /dev/null
+++ b/releasenotes/notes/2_25_0_release-09410c808881bf21.yaml
@@ -0,0 +1,65 @@
+---
+features:
+  - |
+    WSGI server processes can now notify systemd when they are ready.
+
+  - |
+    Added a new middleware that allows users and operators to configure
+    accounts and containers to use RFC-compliant (i.e., double-quoted)
+    ETags. This may be useful when using Swift as an origin for some content
+    delivery networks. For more information, see the middleware
+    documentation.
+
+  - |
+    Added ``ttfb`` (Time to First Byte) and ``pid`` (Process ID) to the set
+    of available proxy-server log fields. For more information, see
+    the documentation.
+
+fixes:
+  - |
+    Improved proxy-server performance by reducing unnecessary locking,
+    memory copies, and eventlet scheduling.
+
+  - |
+    Reduced object-replicator and object-reconstructor CPU usage by only
+    checking that the device list is current when rings change.
+
+  - |
+    Improved performance of sharded container listings when performing
+    prefix listings.
+
+  - |
+    Improved container-sync performance when data has already been
+    deleted or overwritten.
+
+  - |
+    Account quotas are now enforced even on empty accounts.
+
+  - |
+    Getting an SLO manifest with ``?format=raw`` now responds with an ETag
+    that matches the MD5 of the generated body rather than the MD5 of
+    the manifest stored on disk.
+
+  - |
+    Provide useful status codes in logs for some versioning and symlink
+    subrequests that were previously logged as 499.
+
+  - |
+    Fixed 500 from cname_lookup middleware. Previously, if the looked-up
+    domain was used by domain_remap to update the request path, the
+    server would respond Internal Error.
+
+  - |
+    On Python 3, fixed an issue when reading or writing objects with a content
+    type like ``message/*``. Previously, Swift would fail to respond.
+
+  - |
+    On Python 3, fixed a RecursionError in swift-dispersion-report when
+    using TLS.
+
+  - |
+    Fixed a bug in the new object versioning API that would cause more
+    than ``limit`` results to be returned when listing.
+
+  - |
+    Various other minor bug fixes and improvements.
diff --git a/releasenotes/notes/2_26_0_release-6548eadcba544f72.yaml b/releasenotes/notes/2_26_0_release-6548eadcba544f72.yaml
new file mode 100644
index 0000000000..a9c1ab66da
--- /dev/null
+++ b/releasenotes/notes/2_26_0_release-6548eadcba544f72.yaml
@@ -0,0 +1,216 @@
+---
+features:
+  - |
+    Extend concurrent reads to erasure coded policies. Previously, the
+    options ``concurrent_gets`` and ``concurrency_timeout`` only applied to
+    replicated policies.
+
+  - |
+    Add a new ``concurrent_ec_extra_requests`` option to allow the proxy to
+    make some extra backend requests immediately. The proxy will respond as
+    soon as there are enough responses available to reconstruct.
+
+  - |
+    The concurrent read options (``concurrent_gets``, ``concurrency_timeout``,
+    and ``concurrent_ec_extra_requests``) may now be configured per
+    storage-policy.
+
+  - |
+    Replication servers can now handle all request methods. This allows
+    ssync to work with a separate replication network.
+
+  - |
+    All background daemons now use the replication network. This allows
+    better isolation between external, client-facing traffic and internal,
+    background traffic. Note that during a rolling upgrade, replication
+    servers may respond with ``405 Method Not Allowed``. To avoid this,
+    operators should remove the config option ``replication_server = true``
+    from their replication servers; this will allow them to handle all
+    request methods before upgrading.
+
+  - |
+    S3 API improvements:
+
+    * Fixed some SignatureDoesNotMatch errors when using the AWS .NET SDK.
+
+    * Add basic read support for object tagging. This improves
+      compatibility with AWS CLI version 2. Write support is not
+      yet implemented, so the tag set will always be empty.
+
+    * CompleteMultipartUpload requests may now be safely retried.
+
+    * Improved quota-exceeded error messages.
+
+    * Improved logging and statsd metrics. Be aware that this will cause
+      an increase in the proxy-logging statsd metrics emitted for S3
+      responses. However, this should more accurately reflect the state
+      of the system.
+
+    * S3 requests are now less demanding on the container layer.
+
+  - |
+    Servers now open one listen socket per worker, ensuring each worker
+    serves roughly the same number of concurrent connections.
+
+  - |
+    Server workers may now be gracefully terminated via ``SIGHUP`` or
+    ``SIGUSR1``. The parent process will then spawn a fresh worker.
+
+  - |
+    Allow proxy-logging middlewares to be configured more independently.
+
+  - |
+    Improve performance when increasing partition power.
+
+issues:
+  - |
+    In a rolling upgrade from liberasurecode 1.5.0 or earlier to 1.6.0 or
+    later, object-servers may quarantine newly-written data, leading to
+    availability issues or even data loss. See `bug 1886088
+    <https://bugs.launchpad.net/swift/+bug/1886088>`__ for more
+    information, including how to determine whether you are affected.
+    Several mitigations are available to operators:
+
+    * If proxy and object layers can be upgraded independently and proxies
+      can be upgraded quickly:
+
+      1. Stop and disable the object-reconstructor before upgrading. This
+         ensures no upgraded object server starts writing new fragments
+         that old object servers would quarantine.
+
+      2. Upgrade liberasurecode on all object servers. Object servers can
+         now read both old and new fragments.
+
+      3. Upgrade liberasurecode on all proxy servers. Newly-written data
+         will now use new fragments. Note that not-yet-upgraded proxies
+         will not be able to read these newly-written fragments but will
+         instead respond ``500 Internal Server Error``.
+
+      4. After upgrading, re-enable and restart the object-reconstructor.
+
+    * If your users can tolerate it, consider a read-only rolling upgrade.
+      Before upgrading, enable the read-only middleware
+      cluster-wide to prevent new writes during the upgrade. Additionally,
+      stop and disable the object-reconstructor as above. Upgrade normally,
+      then disable the read-only middleware and re-enable and restart the
+      object-reconstructor.
+
+    * Avoid upgrading liberasurecode until swift and liberasurecode
+      better-support a rolling upgrade. Swift remains compatible with
+      liberasurecode 1.5.0 and earlier.
+
+    .. note::
+       Ubuntu 18.04 and RDO's CentOS 7 repos package liberasurecode 1.5.0,
+       while Ubuntu 20.04 and RDO's CentOS 8 repos currently package
+       liberasurecode 1.6.0 or 1.6.1. Take care when upgrading major distro
+       versions!
+
+upgrade:
+  - |
+    **If your cluster has encryption enabled and is still running Swift
+    under Python 2**, we recommend upgrading Swift *before* transitioning to
+    Python 3. Otherwise, new writes to objects with non-ASCII characters
+    in their paths may result in corrupted downloads when read from a
+    proxy-server still running old swift on Python 2. See `bug 1888037
+    <https://bugs.launchpad.net/swift/+bug/1888037>`__ for more information.
+    Note that new tags including a fix for the bug are planned for all
+    maintained stable branches; upgrading to any one of those should be
+    sufficient to ensure a smooth upgrade to the latest Swift.
+
+  - |
+    The above bug was caused by a difference in string types that resulted
+    in ambiguity when decrypting. To prevent the ambiguity for new data, set
+    ``meta_version_to_write = 3`` in your keymaster configuration *after*
+    upgrading all proxy servers.
+
+    If upgrading from Swift 2.20.0 or Swift 2.19.1 or earlier, set
+    ``meta_version_to_write = 1`` in your keymaster configuration *prior*
+    to upgrading.
+
+    See the provided ``keymaster.conf-sample`` for more information about
+    this setting.
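+
+    A sketch of the post-upgrade setting, assuming the simple keymaster
+    configured in proxy-server.conf::
+
+        [filter:keymaster]
+        meta_version_to_write = 3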
+
+  - |
+    **If your cluster is configured with a separate replication network**,
+    note that background daemons will switch to using this network for all
+    traffic. If your account, container, or object replication servers are
+    configured with ``replication_server = true``, these daemons may log a
+    flood of ``405 Method Not Allowed`` messages during a rolling upgrade.
+    To avoid this, comment out the option and restart replication servers
+    before upgrading.
+
+fixes:
+  - |
+    Python 3 bug fixes:
+
+    * Fixed an error when reading encrypted data that was written while
+      running Python 2 for a path that includes non-ASCII characters.
+
+    * Object expiration respects the ``expiring_objects_container_divisor``
+      config option.
+
+    * ``fallocate_reserve`` may be specified as a percentage in more places.
+
+    * The ETag-quoting middleware no longer raises TypeErrors.
+
+  - |
+    Sharding improvements:
+
+    * Prevent object updates from auto-creating shard containers. This
+      ensures more consistent listings for sharded containers during
+      rebalances.
+
+    * Deleted shard containers are no longer considered root containers.
+      This prevents unnecessary sharding audit failures and allows the
+      deleted shard database to actually be unlinked.
+
+    * ``swift-container-info`` now summarizes shard range information.
+      Pass ``-v``/``--verbose`` if you want to see all of them.
+
+    * Improved container-sharder stat reporting to reduce load on root
+      container databases.
+
+    * Don't inject shard ranges when user quits.
+
+  - |
+    During rebalances, clients should no longer get 404s for data that
+    exists but whose replicas are overloaded.
+
+  - |
+    Improved cache management for account and container responses.
+
+  - |
+    Allow operators to pass either raw or URL-quoted paths to
+    ``swift-get-nodes``. Notably, this allows ``swift-get-nodes`` to
+    work with the reserved namespace used for object versioning.
+
+  - |
+    Container read ACLs now work with object versioning. This only
+    allows access to the most-recent version via an unversioned URL.
+
+  - |
+    Improved how containers reclaim deleted rows to reduce locking and
+    improve object update throughput.
+
+  - |
+    Large object reads log fewer client disconnects.
+
+  - |
+    Allow ratelimit to be placed multiple times in a proxy pipeline,
+    such as both before s3api and auth (to handle swift requests without
+    needing to make an auth decision) and after (to limit S3 requests).
+
+  - |
+    Shuffle object-updater work. This somewhat reduces the impact a
+    single overloaded database has on other containers' listings.
+
+  - |
+    Fix a proxy-server error when retrieving erasure coded data when
+    there are durable fragments but not enough to reconstruct.
+
+  - |
+    Fix an error in the proxy server when finalizing data.
+
+  - |
+    Various other minor bug fixes and improvements.
diff --git a/releasenotes/notes/2_27_0_release-a9ae967d6d271342.yaml b/releasenotes/notes/2_27_0_release-a9ae967d6d271342.yaml
new file mode 100644
index 0000000000..2a2231a59d
--- /dev/null
+++ b/releasenotes/notes/2_27_0_release-a9ae967d6d271342.yaml
@@ -0,0 +1,235 @@
+---
+features:
+  - |
+    Added "audit watcher" hooks to allow operators to run arbitrary code
+    against every diskfile in a cluster. For more information, see the
+    documentation.
+
+  - |
+    Added support for system-scoped "reader" roles when authenticating using
+    Keystone. Operators may configure this using the ``system_reader_roles``
+    option in the ``[filter:keystoneauth]`` section of their proxy-server.conf.
+
+    A comparable group, ``.reseller_reader``, is now available for development
+    purposes when authenticating using tempauth.
+
+  - |
+    Allow static large object segments to be deleted asynchronously.
+    Operators may opt into this new behavior by enabling the new
+    ``allow_async_delete`` option in the ``[filter:slo]`` section
+    in their proxy-server.conf. For more information, see `the documentation
+    `__.
+
+  - |
+    Added the ability to connect to memcached over TLS. See the
+    ``tls_*`` options in etc/memcache.conf-sample
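+
+    A minimal sketch (option names as in the sample memcache config; the
+    path is a placeholder)::
+
+        [memcache]
+        tls_enabled = true
+        tls_cafile = /etc/swift/memcache-ca.crt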
+
+  - |
+    The proxy-server now caches 'listing' shards, improving listing
+    performance for sharded containers. A new config option,
+    ``recheck_listing_shard_ranges``, controls the cache time and defaults to
+    10 minutes; set it to 0 to disable caching (the previous behavior).
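+
+    For example, to cache listing shards for five minutes instead of the
+    default ten (section name assumed from the sample proxy config)::
+
+        [app:proxy-server]
+        recheck_listing_shard_ranges = 300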
+
+  - |
+    Added a new optional proxy-logging field ``{wire_status_int}`` for the
+    status code returned to the client. For more information, see the
+    documentation.
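+
+    A sketch of adding it to a logging template (the other fields are just
+    examples)::
+
+        [filter:proxy-logging]
+        log_msg_template = {client_ip} {method} {path} {status_int} {wire_status_int}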
+
+  - |
+    Memcache client error-limiting is now configurable. See the
+    ``error_suppression_*`` options in etc/memcache.conf-sample
+
+  - |
+    Added ``tasks_per_second`` option to rate-limit the object-expirer.
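+
+    For example (the value is illustrative only)::
+
+        [object-expirer]
+        tasks_per_second = 50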
+
+  - |
+    Added ``usedforsecurity`` annotations for use on FIPS-compliant systems.
+
+  - |
+    S3 API improvements:
+
+    * Make allowable clock skew configurable, with a default value of
+      15 minutes to match AWS. Note that this was previously hardcoded at
+      5 minutes; operators may want to preserve the prior behavior by setting
+      ``allowable_clock_skew = 300`` in the ``[filter:s3api]`` section of their
+      proxy-server.conf.
+
+    * Container ACLs are now cloned to the ``+segments`` container when it is
+      created.
+
+    * Added the ability to configure auth region in s3token middleware.
+
+    * CORS-related headers are now passed through appropriately when using
+      the S3 API. Note that allowed origins and other container metadata
+      must still be configured through the Swift API.
+
+      Preflight requests do not contain enough information to map a
+      bucket to an account/container pair; a new cluster-wide option
+      ``cors_preflight_allow_origin`` may be configured for such OPTIONS
+      requests. The default (blank) rejects all S3 preflight requests.
+
+  - |
+    Sharding improvements:
+
+    * A ``--no-auto-shard`` option has been added to ``swift-container-sharder``.
+
+    * The sharder daemon has been enhanced to better support the shrinking
+      of shards that are no longer required. Shard containers will now
+      discover from their root container if they should be shrinking. They
+      will also discover the shards into which they should shrink, which may
+      include the root container itself.
+
+    * A 'compact' command has been added to ``swift-manage-shard-ranges`` that
+      enables sequences of contiguous shards with low object counts to be
+      compacted into another existing shard, or into the root container.
+
+    * ``swift-manage-shard-ranges`` can now accept a config file; this
+      may be used to ensure consistency of threshold values with the
+      container-sharder config.
+
+    * The sharding progress reports in recon cache now continue to be included
+      for a period of time after sharding has completed. The time period
+      may be configured using the ``recon_sharded_timeout`` option in the
+      ``[container-sharder]`` section of container-server.conf, and defaults
+      to 12 hours.
+
+    * Add root containers with compactible ranges to recon cache.
+
+    * Expose sharding statistics in the backend recon middleware.
+
+  - |
+    Replication improvements:
+
+    * The post-rsync REPLICATE call no longer recalculates hashes immediately.
+
+    * Hashes are no longer invalidated after a successful ssync; they were
+      already invalidated during the data transfer.
+
+  - |
+    Added support for Python 3.9.
+
+  - |
+    Partition power increase improvements:
+
+    * Fixed a bug where stale state files would cause misplaced data during
+      multiple partition power increases.
+
+    * Removed a race condition that could cause newly-written data to not be
+      linked into the new partition for the new partition power.
+
+    * Improved safety during cleanup to ensure files have been relinked
+      appropriately before unlinking.
+
+    * Added an option to drop privileges when running the relinker as root.
+
+    * Added an option to rate-limit how quickly data files are relinked or
+      cleaned up. This may be used to reduce I/O load during partition power
+      increases, improving end-user performance.
+
+    * Rehash partitions during the partition power increase. Previously, we
+      relied on the replication engine to perform the rehash, which could
+      cause an unexpected I/O spike after a partition power increase.
+
+    * Warn when relinking/cleaning up and any disks are unmounted.
+
+    * Log progress per partition when relinking/cleaning up.
+
+    * During clean-up, stop warning about tombstones that got reaped from
+      the new location but not the old.
+
+    * Added the ability to read options from object-server.conf, similar to
+      background daemons.
+
+issues:
+  - |
+    Operators should verify that encryption is not enabled in their reconciler
+    pipelines; having it enabled there may harm data durability. For more
+    information, see `bug 1910804
+    <https://bugs.launchpad.net/swift/+bug/1910804>`__.
+
+upgrade:
+  - |
+    Added an option to write EC fragments with legacy CRC to ensure a smooth
+    upgrade from liberasurecode<=1.5.0 to >=1.6.2. For more information, see
+    `bug 1886088 <https://bugs.launchpad.net/swift/+bug/1886088>`__.
+
+fixes:
+  - |
+    Errors downloading a Static Large Object that cause a shorter-than-expected
+    response are now logged as 500s.
+
+  - |
+    S3 API fixes:
+
+    * Fixed a bug that prevented the s3api pipeline validation described in
+      proxy-server.conf-sample from being performed. As documented, operators
+      can disable this via the ``auth_pipeline_check`` option if proxy startup
+      fails with validation errors.
+
+    * Fixed an issue where SHA mismatches in client XML payloads would cause
+      a server error. Swift now correctly responds with a client error about
+      the bad digest.
+
+    * Fixed an issue where non-base64 signatures would cause a server error.
+      Swift now correctly responds with a client error about the invalid
+      digest.
+
+    * The correct storage policy is now logged for S3 requests.
+
+  - |
+    Sharding fixes:
+
+    * Prevent shard databases from losing track of their root database when
+      deleted.
+
+    * Prevent sharded root databases from being reclaimed to ensure that
+      shards can detect that they have been deleted.
+
+    * Overlapping shrinking shards no longer generate audit warnings; these
+      are expected to sometimes overlap.
+
+  - |
+    Replication fixes:
+
+    * Fixed a race condition in ssync that could lead to a loss of data
+      durability (or even loss of data, for two-replica policies) when some
+      object servers have outdated rings. Replication via rsync is likely
+      still affected by a similar bug.
+
+    * Non-durable fragments can now be reverted from handoffs.
+
+    * Reduced log noise for common ssync errors.
+
+  - |
+    Python 3 fixes:
+
+    * Staticweb correctly handles listings when paths include non-ASCII
+      characters.
+
+    * S3 API now allows multipart uploads with non-ASCII characters in the
+      object name.
+
+    * Fixed an import-ordering issue in ``swift-dispersion-populate``.
+
+  - |
+    Turned off thread-logging when monkey-patching with eventlet. This
+    addresses a potential hang in the proxy-server while logging client
+    disconnects.
+
+  - |
+    Fixed a bug that could cause EC GET responses to return a server error.
+
+  - |
+    Fixed an issue with ``swift-drive-audit`` when run around New Year's.
+
+  - |
+    Server errors encountered when validating the first segment of a Static or
+    Dynamic Large Object now return a 503 to the client, rather than a 409.
+
+  - |
+    Errors when setting keys in memcached are now logged. This helps
+    operators detect when shard ranges for caching have gotten too large to
+    be stored, for example.
+
+  - |
+    Various other minor bug fixes and improvements.
diff --git a/releasenotes/notes/2_28_0_release-f2515e07fb61cd01.yaml b/releasenotes/notes/2_28_0_release-f2515e07fb61cd01.yaml
new file mode 100644
index 0000000000..bd3fdde75d
--- /dev/null
+++ b/releasenotes/notes/2_28_0_release-f2515e07fb61cd01.yaml
@@ -0,0 +1,235 @@
+---
+features:
+  - |
+    ``swift-manage-shard-ranges`` improvements:
+
+    * Exit codes are now applied more consistently:
+
+      - 0 for success
+      - 1 for an unexpected outcome
+      - 2 for invalid options
+      - 3 for user exit
+
+      As a result, some errors that previously resulted in exit code 2
+      will now exit with code 1.
+
+    * Added a new 'repair' command to automatically identify and
+      optionally resolve overlapping shard ranges.
+
+    * Added a new 'analyze' command to automatically identify overlapping
+      shard ranges and recommend a resolution based on a JSON listing
+      of shard ranges such as produced by the 'show' command.
+
+    * Added a ``--includes`` option for the 'show' command to only output
+      shard ranges that may include a given object name.
+
+    * Added a ``--dry-run`` option for the 'compact' command.
+
+    * The 'compact' command now outputs the total number of compactible
+      sequences.
+
+  - |
+    Partition power increase improvements:
+
+    * The relinker now spawns multiple subprocesses to process disks
+      in parallel. By default, one worker is spawned per disk; use the
+      new ``--workers`` option to control how many subprocesses are used.
+      Use ``--workers=0`` to maintain the previous behavior.
+
+    * The relinker can now target specific storage policies or
+      partitions by using the new ``--policy`` and ``--partition``
+      options.
+
+  - |
+    More daemons now support systemd notify sockets.
+
+  - |
+    The container-reconciler now scales out better with new ``processes``,
+    ``process``, and ``concurrency`` options, similar to the object-expirer.
+deprecations:
+  - |
+    Container sharding deprecations:
+
+    * Added a new config option, ``shrink_threshold``, to specify the
+      absolute size below which a shard will be considered for shrinking.
+      This overrides the ``shard_shrink_point`` configuration option, which
+      expressed this as a percentage of ``shard_container_threshold``.
+      ``shard_shrink_point`` is now deprecated.
+
+    * Similar to above, ``expansion_limit`` was added as an absolute-size
+      replacement for the now-deprecated ``shard_shrink_merge_point``
+      configuration option.
+fixes:
+  - |
+    Sharding improvements:
+
+    * When building a listing from shards, any failure to retrieve
+      listings will result in a 503 response. Previously, failures
+      fetching a particular shard would result in a gap in listings.
+
+    * Container-server logs now include the shard path in the referer
+      field when receiving stat updates.
+
+    * Added a new config option, ``rows_per_shard``, to specify how many
+      objects should be in each shard when scanning for ranges. The default
+      is ``shard_container_threshold / 2``, preserving existing behavior.
+
+    * Added a new config option, ``minimum_shard_size``. When scanning
+      for shard ranges, if the final shard would otherwise contain
+      fewer than this many objects, the previous shard will instead
+      be expanded to the end of the namespace (and so may contain up
+      to ``rows_per_shard + minimum_shard_size`` objects). This reduces
+      the number of small shards generated. The default value is
+      ``rows_per_shard / 5``.
+
+    * The sharder now correctly identifies and fails audits for shard
+      ranges that overlap exactly.
+
+    * The sharder and swift-manage-shard-ranges now consider total row
+      count (instead of just object count) when deciding whether a shard
+      is a candidate for shrinking.
+
+    * If the sharder encounters shard range gaps while cleaving, it will
+      now log an error and halt sharding progress. Previously, rows may
+      not have been moved properly, leading to data loss.
+
+    * Sharding cycle time and last-completion time are now available via
+      swift-recon.
+
+    * Fixed an issue where resolving overlapping shard ranges via shrinking
+      could prematurely mark created or cleaved shards as active.
+
+  - |
+    S3 API improvements:
+
+    * Added an option, ``ratelimit_as_client_error``, to return 429s for
+      rate-limited responses. Several clients/SDKs seem to support
+      retries with backoffs on 429, and treating it as a client error
+      cleans up logging and metrics. By default, Swift will respond 503,
+      matching AWS documentation.
+
+    * Fixed a server error in bucket listings when ``s3_acl`` is enabled
+      and staticweb is configured for the container.
+
+    * Fixed a server error when a client exceeds ``client_timeout`` during an
+      upload. Now, a ``RequestTimeout`` error is correctly returned.
+
+    * Fixed a server error when downloading multipart uploads/static large
+      objects that have missing or inaccessible segments. This is a state
+      that cannot arise in AWS, so a new ``BrokenMPU`` error is returned,
+      indicating that retrying the request is unlikely to succeed.
+
+    * Fixed several issues with the prefix, marker, and delimiter
+      parameters that would be mirrored back to clients when listing
+      buckets.
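+
+    As a sketch of the ``ratelimit_as_client_error`` option mentioned above,
+    assuming the usual ``[filter:s3api]`` section of proxy-server.conf::
+
+        [filter:s3api]
+        # return 429 instead of the default 503 for rate-limited requests
+        ratelimit_as_client_error = true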
+
+  - |
+    Partition power increase fixes:
+
+    * The relinker now performs eventlet-hub selection the same way as
+      other daemons. In particular, ``epolls`` will no longer be selected,
+      as it seemed to cause occasional hangs.
+
+    * Partitions that encountered errors during relinking are no longer
+      marked as completed in the relinker state file. This ensures that
+      a subsequent relink will retry the failed partitions.
+
+    * Partition cleanup is more robust, decreasing the likelihood of
+      leaving behind mostly-empty partitions from the old partition
+      power.
+
+    * Improved relinker progress logging, and started collecting
+      progress information for swift-recon.
+
+    * Cleanup is more robust to files and directories being deleted by
+      another process.
+
+    * The relinker better handles data found from earlier partition power
+      increases.
+
+    * The relinker better handles tombstones found for the same object
+      but with different inodes.
+
+    * The reconciler now defers working on policies that have a partition
+      power increase in progress to avoid issues with concurrent writes.
+
+  - |
+    Erasure coding fixes:
+
+    * Added the ability to quarantine EC fragments that have no (or few)
+      other fragments in the cluster. A new configuration option,
+      ``quarantine_threshold``, in the reconstructor controls the point at
+      which a fragment will be quarantined; the default (0) will never
+      quarantine. Only fragments older than ``quarantine_age`` (default:
+      ``reclaim_age``) may be quarantined. Before quarantining, the
+      reconstructor will attempt to fetch fragments from handoff nodes
+      in addition to the usual primary nodes; a new ``request_node_count``
+      option (default ``2 * replicas``) limits the total number of nodes to
+      contact. An example appears after this list.
+
+    * Added a delay before deleting non-durable data. A new configuration
+      option, ``commit_window`` in the ``[DEFAULT]`` section of
+      object-server.conf, adjusts this delay; the default is 60 seconds. This
+      improves the durability of both back-dated PUTs (from the reconciler or
+      container-sync, for example) and fresh writes to handoffs by preventing
+      the reconstructor from deleting data that the object-server was still
+      writing.
+
+    * Improved proxy-server and object-reconstructor logging when data
+      cannot be reconstructed.
+
+    * Fixed an issue where metadata applied to some but not all fragments
+      could prevent reconstruction of missing fragments.
+
+    * Server-side copying of erasure-coded data to a replicated policy no
+      longer copies EC sysmeta. The previous behavior had no material
+      effect, but could confuse operators examining data on disk.
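+
+    A minimal sketch of the quarantine and ``commit_window`` options
+    described above (values are illustrative, and the reconstructor options
+    are assumed to live in an ``[object-reconstructor]`` section of
+    object-server.conf)::
+
+        [DEFAULT]
+        # delay before the reconstructor may delete non-durable data
+        commit_window = 60
+
+        [object-reconstructor]
+        # non-zero enables quarantining of isolated fragments (0 = never)
+        quarantine_threshold = 1
+        # only fragments older than this may be quarantined; defaults
+        # to reclaim_age
+        quarantine_age = 604800
+        # total number of nodes to contact while looking for other fragments
+        request_node_count = 2 * replicas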
+
+  - |
+    Python 3 fixes:
+
+    * Fixed a server error when performing a PUT authorized via
+      tempurl with some proxy pipelines.
+
+    * Fixed a server error during GET of a symlink with some proxy
+      pipelines.
+
+    * Fixed an issue with logging setup when /dev/log doesn't exist
+      or is not a UNIX socket.
+
+  - |
+    The dark-data audit watcher now skips objects younger than a new
+    configurable ``grace_age`` period. This avoids issues where data
+    could be flagged, quarantined, or deleted because of listing
+    consistency issues. The default is one week.
+
+  - |
+    The dark-data audit watcher now requires that all primary locations
+    for an object's container agree that the data does not appear in
+    listings to consider data "dark". Previously, a network partition
+    that left an object node isolated could cause it to quarantine or
+    delete all of its data.
+
+  - |
+    ``EPIPE`` errors no longer log tracebacks.
+
+  - |
+    The account and container auditors now log and update recon before
+    going to sleep.
+
+  - |
+    The object-expirer logs fewer client disconnects.
+
+  - |
+    ``swift-recon-cron`` now includes the last time it was run in the recon
+    information.
+
+  - |
+    ``EIO`` errors during read now cause object diskfiles to be quarantined.
+
+  - |
+    The formpost middleware now properly supports uploading multiple files
+    with different content-types.
+
+  - |
+    Various other minor bug fixes and improvements.
diff --git a/releasenotes/notes/2_29_0_release-af71f7efd73109b0.yaml b/releasenotes/notes/2_29_0_release-af71f7efd73109b0.yaml
new file mode 100644
index 0000000000..0a14ffcece
--- /dev/null
+++ b/releasenotes/notes/2_29_0_release-af71f7efd73109b0.yaml
@@ -0,0 +1,167 @@
+---
+features:
+  - |
+    S3 API improvements
+
+    * CORS preflights are now allowed for pre-signed URLs.
+
+    * The ``storage_domain`` option now accepts a comma-separated list of
+      storage domains. This allows multiple storage domains to be configured
+      for use with virtual-host style addressing.
+
+    * Reduced the overhead of retrieving bucket and object ACLs.
+
+  - |
+    Replication, reconstruction, and diskfile improvements
+
+    * The reconstructor now uses the replication network to fetch fragments
+      for reconstruction.
+
+    * Added the ability to limit how many objects per handoff partition
+      will be reverted in a reconstructor cycle using the new
+      ``max_objects_per_revert`` option. This may be useful to reduce
+      ssync timeouts and lock contention, ensuring that progress is made
+      during rebalances.
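+
+    For example (value is illustrative; the option is assumed to live in
+    the usual ``[object-reconstructor]`` section of object-server.conf)::
+
+        [object-reconstructor]
+        # cap how many objects are reverted per handoff partition per cycle
+        max_objects_per_revert = 1000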
+
+  - |
+    Object updater improvements
+
+    * Added the ability to ratelimit updates (approximately) per-container
+      using the new ``max_objects_per_container_per_second`` option. This may
+      be used to limit requests to already-overloaded containers while still
+      making progress on updates to other containers.
+
+    * Added timing stats by response code.
+
+    * Updates are now sent over the replication network.
+
+  - |
+    Memcache improvements
+
+    * Added the ability to configure a chance to skip checking memcache when
+      querying shard ranges. This allows some fraction of traffic to go to
+      disk and refresh memcache before the key ages out. Recommended values
+      for the new ``container_updating_shard_ranges_skip_cache_pct`` and
+      ``container_listing_shard_ranges_skip_cache_pct`` options are in the
+      range of 0.0 to 0.1.
+
+    * Added stats for shard range cache hits, misses, and skips.
+
+  - |
+    Added object-reconstructor stats to recon.
+
+  - |
+    Added a new ``swift.common.registry`` module. This includes helper
+    functions ``register_sensitive_header`` and ``register_sensitive_param``
+    which third party middleware authors may use to flag headers and query
+    parameters for redaction when logging. For more information, see `the
+    documentation `__.
+
+  - |
+    Added the ability to configure project-scope read-only roles for
+    keystoneauth using the new ``project_reader_roles`` option.
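+
+    A minimal sketch (the role name is illustrative; the option is assumed
+    to live in the usual ``[filter:keystoneauth]`` section of
+    proxy-server.conf)::
+
+        [filter:keystoneauth]
+        project_reader_roles = ProjectReader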
+
+  - |
+    The ``cname_lookup`` middleware now works with dnspython 2.0 and later.
+
+  - |
+    The internal clients used by the container-reconciler, container-sharder,
+    container-sync, and object-expirer daemons now use a more-descriptive
+    ``-ic`` log name, rather than ``swift``. If you previously
+    configured the ``log_name`` option in ``internal-client.conf``, you must
+    now use the ``set log_name = `` syntax to configure it, even if
+    no value is set in the ``[DEFAULT]`` section. This may be done prior to
+    upgrading.
+
+  - |
+    Removed translations from most logging.
+
+deprecations:
+  - |
+    The ``StatsdClient.set_prefix`` method is now deprecated and
+    may be removed in a future release; by extension, so is the
+    ``LogAdapter.set_statsd_prefix`` method. Middleware developers should
+    use the ``statsd_tail_prefix`` argument to ``get_logger`` instead.
+
+fixes:
+  - |
+    S3 API fixes
+
+    * Fixed the types of configured values in ``/info`` response.
+
+    * Fixed a server error when trying to copy objects with non-ASCII names.
+
+    * Fixed a server error when uploading objects with very long names.
+      A ``KeyTooLongError`` is now returned.
+
+    * Fixed an error when multi-deleting MPUs when SLO async-deletes
+      are enabled.
+
+    * Fixed an error that allowed list-uploads and list-parts requests to
+      return incomplete or out-of-order results.
+
+    * Fixed several bugs when dealing with non-ASCII object names and
+      multipart uploads.
+
+  - |
+    Replication, reconstruction, and diskfile fixes
+
+    * Ensure that non-durable data and .meta files are purged from handoffs
+      after syncing.
+
+    * Fixed tracebacks when there's a race to mark a file durable or delete it.
+
+    * Improved cooperative multitasking during ssync.
+
+    * Upon detecting a ring change, the reconstructor now only aborts the
+      jobs for that ring and continues processing jobs for other rings.
+
+    * Fixed a traceback when logging about a lock timeout in the replicator.
+
+  - |
+    Fixed a security issue where tempurl and s3api signatures were logged in
+    full. This allowed an attacker with access to log data to perform replay
+    attacks, potentially accessing or overwriting cluster data. Now, such
+    signatures are redacted in a manner similar to auth tokens; see the
+    ``reveal_sensitive_prefix`` option in ``proxy-server.conf``.
+
+    See CVE-2017-8761 for more information.
+
+  - |
+    Fixed a race condition where swift would attempt to quarantine
+    recently-deleted object updates.
+
+  - |
+    Improved handling of timeouts and other errors when obtaining a
+    connection to memcached.
+
+  - |
+    The ``swift-recon`` tool now queries each object-server IP only once
+    when reporting disk usage. Previously, each port in the ring would be
+    queried; when using servers-per-port, this could dramatically overstate
+    the disk capacity in the cluster.
+
+  - |
+    Fixed a bug that allowed some statsd metrics to be annotated with the
+    wrong backend layer.
+
+  - |
+    Fixed a traceback in the account-server when there's no account
+    database on disk to receive a container update. The account-server
+    now correctly 404s.
+
+  - |
+    The container-updater will quarantine container databases if all
+    replicas for the account respond 404.
+
+  - |
+    Fixed a proxy-server error when the read-only middleware tried to
+    handle non-Swift paths (such as may be used by third-party middleware).
+
+  - |
+    Some client behaviors that the proxy previously logged at warning have
+    been lowered to info.
+
+  - |
+    Various other minor bug fixes and improvements.
diff --git a/releasenotes/notes/2_29_1_release-a2962252523d9396.yaml b/releasenotes/notes/2_29_1_release-a2962252523d9396.yaml
new file mode 100644
index 0000000000..537c4be945
--- /dev/null
+++ b/releasenotes/notes/2_29_1_release-a2962252523d9396.yaml
@@ -0,0 +1,41 @@
+---
+deprecations:
+  - |
+    This is the final stable branch that will support Python 2.7.
+
+fixes:
+  - |
+    Fixed s3v4 signature calculation when the client sends an un-encoded
+    path in the request.
+
+  - |
+    Fixed multiple issues in s3api involving Multipart Uploads with
+    non-ASCII names.
+
+  - |
+    The object-updater now defers rate-limited updates to the end of its
+    cycle; these deferred updates will be processed (at the limited rate)
+    until the configured ``interval`` elapses. A new ``max_deferred_updates``
+    option may be used to bound the deferral queue.
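+
+    For example (value is illustrative; the option is assumed to live in
+    the usual ``[object-updater]`` section of object-server.conf)::
+
+        [object-updater]
+        # bound the number of rate-limited updates deferred each cycle
+        max_deferred_updates = 10000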
+
+  - |
+    Empty account and container partition directories are now cleaned up
+    immediately after replication, rather than needing to wait for an
+    additional replication cycle.
+
+  - |
+    The object-expirer now only cleans up empty containers. Previously, it
+    would attempt to delete all processed containers, regardless of whether
+    there were entries which were skipped or had errors.
+
+  - |
+    A new ``item_size_warning_threshold`` option may be used to monitor for
+    values that are approaching the limit of what can be stored in memcache.
+    See the memcache sample config for more information.
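+
+    As a sketch only (both the section and the value are assumptions; the
+    memcache sample config is authoritative)::
+
+        [memcache]
+        # warn when a cached value approaches this many bytes
+        item_size_warning_threshold = 1000000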
+
+  - |
+    Internal clients now correctly use their configured ``User-Agent`` in
+    backend requests, rather than only using it for logging.
+
+  - |
+    Various other minor bug fixes and improvements.
diff --git a/releasenotes/notes/2_30_0_release-642778c3010848db.yaml b/releasenotes/notes/2_30_0_release-642778c3010848db.yaml
new file mode 100644
index 0000000000..e918df16cf
--- /dev/null
+++ b/releasenotes/notes/2_30_0_release-642778c3010848db.yaml
@@ -0,0 +1,167 @@
+---
+features:
+  - |
+    Sharding improvements
+
+    * The ``swift-manage-shard-ranges`` tool has a new mode to repair gaps
+      in the namespace.
+
+    * Metrics are now emitted for whether databases used for cleaving
+      were created or already existed, allowing a better understanding
+      of the reason for handoffs in the cluster.
+
+    * Misplaced-record stats are now also emitted to statsd. Previously,
+      these were only available in logs.
+
+  - |
+    Logging improvements
+
+    * The message template for proxy logging may now include a
+      ``{domain}`` field for the client-provided ``Host`` header.
+
+    * Added a ``log_rsync_transfers`` option to the object-replicator.
+      Set it to false to disable logging rsync "send" lines; during
+      large rebalances, such logging can overwhelm log aggregation
+      while providing little useful information.
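+
+    For example, assuming the usual ``[object-replicator]`` section of
+    object-server.conf::
+
+        [object-replicator]
+        # silence per-file rsync "send" log lines during large rebalances
+        log_rsync_transfers = false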
+
+  - |
+    The formpost digest algorithm is now configurable via the new
+    ``allowed_digests`` option, and support is added for both SHA-256
+    and SHA-512. Supported formpost digests are exposed to clients in
+    ``/info``. Additionally, formpost signatures can now be base64 encoded.
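+
+    A minimal sketch (the space-separated list format is an assumption;
+    the option is expected in the usual ``[filter:formpost]`` section of
+    proxy-server.conf)::
+
+        [filter:formpost]
+        # accept (and advertise in /info) only SHA-2 signatures
+        allowed_digests = sha256 sha512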
+
+  - |
+    Added metrics to the formpost and tempurl middlewares to monitor
+    digest usage in signatures.
+
+  - |
+    Improved compatibility with certain FIPS-mode-enabled systems.
+
+  - |
+    Added a ``ring_ip`` option for various object services. This may be
+    used to find a node's own devices in the ring in a containerized
+    environment where the ``bind_ip`` may not appear in the ring at all.
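+
+    A minimal sketch (the IP is illustrative; the option is assumed to sit
+    alongside ``bind_ip`` in the ``[DEFAULT]`` section of
+    object-server.conf)::
+
+        [DEFAULT]
+        bind_ip = 0.0.0.0
+        # IP to look for in the ring, instead of bind_ip
+        ring_ip = 192.0.2.10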
+
+  - |
+    Account and container replicators can now be configured with a
+    ``handoff_delete`` option, similar to object replicators and
+    reconstructors. See the sample config for more information.
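+
+    For example (value is illustrative; see the sample config for the exact
+    semantics)::
+
+        [account-replicator]
+        handoff_delete = 2
+
+        [container-replicator]
+        handoff_delete = 2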
+
+  - |
+    Developers using Swift's memcache client may now opt in to having
+    a ``MemcacheConnectionError`` be raised when no connection succeeded
+    using a new ``raise_on_error`` keyword argument to ``get``/``set``.
+
+  - |
+    Device names are now included in new database IDs. This provides more
+    context when examining incoming/outgoing sync tables or sharding
+    CleaveContexts.
+
+deprecations:
+  - |
+    SHA-1 signatures are now deprecated for the formpost and tempurl
+    middlewares. At some point in the future, SHA-1 will no longer be
+    enabled by default; eventually, support for it will be removed
+    entirely.
+
+security:
+  - |
+    Constant-time string comparisons are now used when checking S3 API signatures.
+
+  - |
+    Fixed a socket leak when clients try to delete a non-SLO as though
+    it were a Static Large Object.
+
+fixes:
+  - |
+    Sharding improvements
+
+    * Misplaced tombstone records are now properly cleaved.
+
+    * Fixed a bug where the sharder could fail to find a device to use for
+      cleaving.
+
+    * Databases marked deleted are now processed by the sharder.
+
+    * More information is now synced to the fresh database when sharding.
+      Previously, a database could lose the fact that it had been marked
+      as deleted.
+
+    * Shard ranges with no rows to cleave could previously be left in the
+      CREATED state after cleaving. Now, they are advanced to CLEAVED.
+
+  - |
+    S3 API improvements
+
+    * Fixed cross-policy object copies. Previously, copied data would
+      always be written using the source container's policy. Now, the
+      destination container's policy will be used, avoiding availability
+      issues and unnecessary container-reconciler work.
+
+    * More headers are now copied from multi-part upload markers to their
+      completed objects, including ``Content-Encoding``.
+
+    * When running with ``s3_acl`` disabled, ``bucket-owner-full-control`` and
+      ``bucket-owner-read`` canned ACLs will be translated to the same Swift
+      ACLs as ``private``.
+
+    * The S3 ACL and Delete Multiple APIs are now less case-sensitive.
+
+    * Improved the error message when deleting a bucket that's ever had
+      versioning enabled and still has versions in it.
+
+    * ``LastModified`` timestamps in listings are now rounded up to whole
+      seconds, like they are in responses from AWS.
+
+    * Proxy logging for Complete Multipart Upload requests is now more
+      consistent when requests have been retried.
+
+  - |
+    Logging improvements
+
+    * Signal handling is more consistently logged at notice level.
+      Previously, signal handling would sometimes be logged at info
+      or error levels.
+
+    * The object-replicator now logs successful rsync transfers at debug
+      instead of info.
+
+    * Transaction IDs are now only included in daemon log lines
+      in a request/response context.
+
+  - |
+    The tempurl middleware has been updated to return a 503 if storing a
+    token in memcache fails. Third party authentication middlewares are
+    encouraged to also use the new ``raise_on_error`` keyword argument
+    when storing ephemeral tokens in memcache.
+
+  - |
+    Database replication connections are now closed following an error
+    or timeout. This prevents a traceback in some cases when the replicator
+    tries to reuse the connection.
+
+  - |
+    ``ENOENT`` and ``ENODATA`` errors are better handled in the object
+    replicator and auditor.
+
+  - |
+    Improved object update throughput by shifting some shard range
+    filtering from Python to SQL.
+
+  - |
+    Include ``Vary: Origin`` header when CORS responses vary by origin.
+
+  - |
+    The staticweb middleware now allows empty listings at the root of
+    a container. Previously, this would result in a 404 response.
+
+  - |
+    Ring builder output tables better display weights over 1000.
+
+  - |
+    Various other minor bug fixes and improvements.
+
+other:
+  - |
+    Pickle support has been removed from Swift's memcache client. Support
+    had been deprecated since Swift 1.7.0.
diff --git a/releasenotes/notes/2_31_0_release-77e6b20dfba3b32c.yaml b/releasenotes/notes/2_31_0_release-77e6b20dfba3b32c.yaml
new file mode 100644
index 0000000000..ae5d96a637
--- /dev/null
+++ b/releasenotes/notes/2_31_0_release-77e6b20dfba3b32c.yaml
@@ -0,0 +1,118 @@
+---
+features:
+  - |
+    Added support for Python 3.10.
+
+  - |
+    Added an optional ``backend_ratelimit`` middleware for backend servers.
+    See the backend server sample configuration files for more information.
+
+  - |
+    Sharding improvements
+
+    * Added a ``merge`` subcommand to ``swift-manage-shard-ranges`` to merge
+      arbitrary shard ranges into a container DB. Minimal safety checks
+      are performed; it should only be used for emergency shard range
+      manipulation by expert users.
+
+    * Warnings are now emitted when sharding appears to have become stuck.
+      Use the new ``container_sharding_timeout`` option to configure the
+      "stuck" threshold; the default is 48 hours.
+
+  - |
+    Metrics improvements
+
+    * Added timing stats for memcached operations.
+
+    * Renamed and improved the granularity of shard range cache and
+      backend stats. Metrics dashboards may need to be updated.
+
+    * Emit stats when backend nodes are error-limited.
+
+  - |
+    Added the ability to configure a chance to skip checking memcache when
+    querying account and container information. This allows some fraction
+    of traffic to go to disk and refresh memcache before the key ages out.
+    Recommended values for the new ``account_existence_skip_cache_pct`` and
+    ``container_existence_skip_cache_pct`` options are in the range of
+    0.0 to 0.01.
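+
+    For example, using values in the recommended range (the options are
+    assumed to live in the usual ``[app:proxy-server]`` section of
+    proxy-server.conf)::
+
+        [app:proxy-server]
+        account_existence_skip_cache_pct = 0.01
+        container_existence_skip_cache_pct = 0.01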
+
+  - |
+    Absolute-form request targets are now accepted. This enables access for
+    certain clients and SDKs (including some older versions of rclone that
+    were using an old version of aws-sdk-go).
+
+upgrade:
+  - |
+    Static large object segments may now be deleted asynchronously by
+    default. Operators may return to the old behavior by disabling the
+    ``allow_async_delete`` option in the ``[filter:slo]`` section
+    in their proxy-server.conf.
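+
+    For example, to return to the old behavior::
+
+        [filter:slo]
+        allow_async_delete = false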
+
+security:
+  - |
+    Fixed a security issue in how ``s3api`` handles XML parsing that allowed
+    authenticated S3 clients to read arbitrary files from proxy servers.
+    Refer to `CVE-2022-47950 `__
+    for more information.
+
+fixes:
+  - |
+    S3 API improvements
+
+    * Fixed a server error when handling malformed CompleteMultipartUpload
+      requests.
+
+    * Improved error reporting when attempting to set invalid ``X-Delete-At``
+      or ``X-Delete-After`` values via the S3 API.
+
+  - |
+    Sharding improvements
+
+    * Sync more shard ranges from the root database to the shards. This
+      helps ensure shard range repairs effected at the root make their way
+      to shards that would otherwise be stuck trying to further divide
+      into sub-shards.
+
+    * Improved performance of ``delimiter`` listings for sharded containers.
+
+    * Added more safety checks to the ``repair`` subcommand of
+      ``swift-manage-shard-ranges``.
+
+    * Better handle ``EOFError`` and ``KeyboardInterrupt`` when prompting for
+      input in ``swift-manage-shard-ranges``.
+
+    * Stop warning about transient overlaps when auditing shard ranges.
+
+  - |
+    Fixed a path-rewriting bug introduced in Python 3.7.14, 3.8.14, 3.9.14,
+    and 3.10.6 that could cause some ``domain_remap`` requests to be routed to
+    the wrong object.
+
+  - |
+    Fixed a server error when attempting to access data in a deleted
+    container that had an erasure-coded storage policy.
+
+  - |
+    Improved error messages to clients that encounter errors using the
+    ``formpost`` middleware.
+
+  - |
+    Removed some inappropriate error-suppression when locking account and
+    container databases.
+
+  - |
+    Improved server start-up time when using multiple workers.
+
+  - |
+    Removed some unnecessary locking when logging.
+
+  - |
+    Added some basic object-metadata validation; invalid diskfiles will be
+    quarantined via the auditor or reconstructor.
+
+  - |
+    Enhanced logging when error-limiting a backend node.
+
+  - |
+    Various other minor bug fixes and improvements.
diff --git a/releasenotes/notes/2_31_1_release-20ccd07e32b91c1f.yaml b/releasenotes/notes/2_31_1_release-20ccd07e32b91c1f.yaml
new file mode 100644
index 0000000000..9461721d06
--- /dev/null
+++ b/releasenotes/notes/2_31_1_release-20ccd07e32b91c1f.yaml
@@ -0,0 +1,37 @@
+---
+fixes:
+  - |
+    Sharding fixes
+
+    * Shards no longer report stats to the root database when they are in
+      the ``CREATED`` state.
+
+    * Sharding metadata is no longer cleared when databases are deleted.
+      Previously, this could cause deleted shards that still had rows to
+      become stuck, never moving those rows to the correct database.
+
+    * Fixed a performance regression in the handling of misplaced objects.
+
+    * Swift path and on-disk path are now included with all sharder logging.
+
+  - |
+    ``s3token`` no longer mangles request paths that include the Access Key ID.
+
+  - |
+    User metadata is now exposed via CORS when encryption is enabled,
+    matching the behavior when encryption is not enabled.
+
+  - |
+    Fewer backend requests are now required when account or container
+    information is missing from memcache.
+
+  - |
+    Fixed logging of IP and port in the proxy-server; in particular,
+    internal clients now correctly log about the replication IP/port.
+
+  - |
+    Fixed a bug in the object replicator that would cause an under-reporting
+    of failures.
+
+  - |
+    Various other minor bug fixes.
diff --git a/releasenotes/notes/2_32_0_release-39c8fb77a0a3e72d.yaml b/releasenotes/notes/2_32_0_release-39c8fb77a0a3e72d.yaml
new file mode 100644
index 0000000000..240daa5a17
--- /dev/null
+++ b/releasenotes/notes/2_32_0_release-39c8fb77a0a3e72d.yaml
@@ -0,0 +1,122 @@
+---
+features:
+  - |
+    Python 3.11 is now supported.
+
+  - |
+    Added the ability for reseller admins to set per-policy account quotas by
+    posting metadata of the form ``X-Account-Quota-Bytes-Policy-``.
+
+  - |
+    Added a ``keepalive_timeout`` option to the proxy server to limit how long
+    to wait for a client to initiate a request, separate from the general
+    ``client_timeout`` option. Note that this requires eventlet 0.33.4
+    (currently unreleased) or later.
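+
+    A minimal sketch (both the value and the ``[DEFAULT]`` placement are
+    assumptions; check the proxy-server sample config)::
+
+        [DEFAULT]
+        # seconds to wait for a client to start its next request
+        keepalive_timeout = 5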
+
+  - |
+    Added a ``keep_cache_slo_manifest`` option to the object server to better
+    control whether SLO manifests are dropped from the page cache.
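+
+    For example (assuming ``true`` keeps manifests cached, and that the
+    option lives in the usual ``[app:object-server]`` section of
+    object-server.conf)::
+
+        [app:object-server]
+        keep_cache_slo_manifest = true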
+
+  - |
+    WSGI servers now accept a ``--test-config`` option that may be used to
+    validate configuration changes before reloading/restarting the server.
+
+  - |
+    Metrics improvements:
+
+    * Metrics are now emitted for a variety of S3 error responses, in the
+      form ``s3api..[.]``
+
+    * Account and container info metrics now include the response status code
+      when backend requests are made.
+
+    * Added timing metrics to the container sharder for various operations.
+
+  - |
+    A variety of performance improvements have been made for sharded
+    container databases.
+
+  - |
+    Various logging and metrics improvements when talking to memcache.
+
+  - |
+    Improved formatting of meta and sysmeta for ``swift-account-info`` and
+    ``swift-container-info``.
+
+upgrade:
+  - |
+    Previously, under some circumstances, a non-standard config option such
+    as ``RECLAIM_AGE`` might get parsed as ``reclaim_age`` for some processes
+    but ignored by others. Now, all config parsing is case-sensitive;
+    non-standard names will always be ignored.
+
+  - |
+    The structure of cached shard ranges has changed, improving performance
+    when listing or writing to sharded containers. Note that immediately
+    after upgrade, the new structures will all be cache misses, which may
+    lead to a thundering herd problem. To avoid this, upgrade just a few
+    nodes first, let them service some fraction of traffic to populate the
+    cache, then upgrade the rest of the cluster.
+
+deprecations:
+  - |
+    Removed the hard dependency on netifaces; it may still be used if the
+    ``getifaddrs`` C function is not available. This fallback support may be
+    removed in a future release.
+
+fixes:
+  - |
+    Python 3 fixes:
+
+    * Python 3 object servers can now read unencrypted non-ASCII metadata
+      that was written under Python 2.
+
+    * Ssync no longer corrupts unencrypted non-ASCII metadata during
+      transfers.
+
+    * Fixed an encoding issue when writing non-ASCII object names to sharded
+      containers and shard range caching is not enabled.
+
+    * Fixed an encoding issue when handling non-ASCII account names.
+
+    * Fixed a ``generator already executing`` error on client disconnect.
+
+    * Suppressed ``RemoteDisconnected`` tracebacks.
+
+  - |
+    Fixed an issue that prevented proxy servers from emitting metrics and
+    logs for backend requests made when getting account or container info.
+
+  - |
+    Fixed ssync's handling of timestamp offsets. Previously, this could cause
+    ssync to fail with a 409 Conflict, causing the transfer to fail and
+    preventing handoffs from clearing.
+
+  - |
+    Fixed an issue where an erasure-coded PUT could prevent other requests
+    from being processed when network calls rarely or never blocked.
+
+  - |
+    Fixed an issue where downloading an SLO manifest could hit a recoverable
+    error and attempt to resume from another node. This would manifest as
+    either a pyeclib decode error or an unexpected empty response.
+
+  - |
+    The proxy server now applies error-limiting to the correct node when
+    handling a recoverable node error.
+
+  - |
+    Account, container, and object log fields are now correctly identified
+    when returning ``BadDigest`` responses to S3 requests.
+
+  - |
+    Reduced the backend load of making ``?versions`` requests to a container
+    that has never had object versioning enabled.
+
+  - |
+    The standard-library ``logging`` module is no longer monkey-patched when
+    importing ``swift.common.utils``, making it easier to re-use swift code
+    in other contexts.
+
+  - |
+    Various other minor bug fixes and improvements.
diff --git a/releasenotes/notes/3_33_0_release-d208917f5012cedd.yaml b/releasenotes/notes/3_33_0_release-d208917f5012cedd.yaml
new file mode 100644
index 0000000000..d5a44bb980
--- /dev/null
+++ b/releasenotes/notes/3_33_0_release-d208917f5012cedd.yaml
@@ -0,0 +1,129 @@
+---
+features:
+  - |
+    Prefix-based tempurls may now be used to explore staticweb
+    listings within that prefix. Note that this opens a new ability
+    to list containers from tempurls, but only if staticweb's
+    ``X-Container-Meta-Web-Listings`` is enabled.
+
+  - |
+    When generating index pages from listings, staticweb now sends an HTML5
+    doctype. This makes them `PEP 503 `__
+    compliant, allowing their `continued
+    use `__ for simple Python
+    package repositories.
+
+  - |
+    Added basic read support for S3 object locking. This improves
+    compatibility with an Ansible S3 module. Write support is not
+    yet implemented, so get-object-lock-configuration will always 404.
+
+  - |
+    Added a ``swift-reload`` command to assist with safely reloading WSGI
+    servers.
+
+  - |
+    Daemons now send ``STOPPING`` and ``RELOADING`` systemd notifications
+    when the service is configured with ``Type=notify``.
+
+  - |
+    Added more metrics to the container-server, allowing GET and PUT timings
+    to be broken out for listings, shard range operations, and container
+    creation.
+
+  - |
+    Added a counter metric to the proxy server when caching shard ranges.
+
+  - |
+    ``swift-account-info`` and ``swift-container-info`` now accept a ``--sync``
+    flag to show information from the incoming/outgoing sync tables.
+
+  - |
+    Several fixes to prepare for Python 3.12 support. While not yet tested
+    in the gate, initial manual testing looks promising.
+
+  - |
+    Added support for recent versions of eventlet.
+
+fixes:
+  - |
+    S3 API fixes:
+
+    * When the ``+segments`` container's storage policy differs from that of
+      the primary container, completed manifests are now written with the
+      correct policy in the primary container.
+
+    * If there's a conflict deleting the in-progress-upload marker when
+      completing a multipart-upload, a 503 is now returned to the client,
+      prompting it to retry.
+
+    * Added ``Accept-Ranges: bytes`` to object responses. Range requests
+      have always been supported; now, that support is properly advertised.
+
+  - |
+    Static large object fixes:
+
+    * Fixed a server error when handling conditional GET requests.
+
+    * Return an error if the SLO manifest could not be parsed. Previously,
+      a zero-byte response was returned.
+
+  - |
+    Proxy server fixes:
+
+    * Added a new ``swift.proxy_logging_status`` request environment key that
+      middlewares may use to override the logged status for a request.
+
+    * Transaction IDs are included in more error responses.
+
+    * The ``recoverable_node_timeout`` option no longer applies to
+      ``X-Newest`` GET requests.
+
+    * Improved error-handling in multi-part range responses.
+
+  - |
+    Sharding fixes:
+
+    * Prevent resets of a shard range's epoch.
+
+    * Cleaned up ``X-Backend-*`` headers in listing responses.
+
+    * Reduced the frequency of ``Reclaimable db stuck waiting for shrinking``
+      messages when a root DB has been deleted but its shards have not been
+      shrunk away.
+
+    * The more-efficient shard range structure from the last release is now
+      used when fetching ranges from the backend.
+
+    * Include more information in shard-replication warnings.
+
+  - |
+    Object server fixes:
+
+    * Object POSTs and chunked PUTs are no longer accepted when the target
+      drive is already past its ``fallocate_reserve``. DELETEs are still
+      allowed.
+
+    * Added the ability to configure cooperative yielding when servicing
+      GET responses, via the ``cooperative_period`` option. See the example
+      config for more information.
+
+    * Invalid ``hashes.invalid`` entries are now ignored, rather than
+      causing a complete partition rehash.
+
+  - |
+    Per-service ``auto_create_account_prefix`` configuration options have
+    been removed. These options were deprecated in favor of ``swift.conf``
+    configuration in Swift 2.24.0, part of the OpenStack Ussuri release.
+
+  - |
+    Daemons send object updates via the replication network in more cases.
+
+  - |
+    The dark-data object audit watcher now works with sharded containers.
+    Previously, it would think that all data files were absent from
+    listings.
+
+  - |
+    Various other minor bug fixes and improvements.
diff --git a/releasenotes/notes/release-2.34.0-2136ae35f56f8b5a.yaml b/releasenotes/notes/release-2.34.0-2136ae35f56f8b5a.yaml
new file mode 100644
index 0000000000..56af53eae7
--- /dev/null
+++ b/releasenotes/notes/release-2.34.0-2136ae35f56f8b5a.yaml
@@ -0,0 +1,117 @@
+---
+features:
+  - |
+    Middleware features:
+
+    * The static large object (SLO) middleware now supports including
+      a ``?part-number=`` query parameter to request just part of a
+      large object. This may be used to enable efficient parallel
+      downloads. For more information, see `the documentation
+      `__.
+
+    * The S3 API middleware now supports the ``?partNumber=`` query
+      parameter, enabling parallel downloads.
+
+    * The KMS keymaster now supports overriding the endpoint returned
+      in the Keystone catalog via the ``barbican_endpoint`` configuration
+      option. This may be useful in multi-region deployments which have
+      multiple endpoints.
+
+    * The backend ratelimiter now supports dynamic reloading of limits.
+      The new configuration options ``backend_ratelimit_conf_path`` and
+      ``config_reload_interval`` control which file is reloaded and how
+      frequently, respectively.
+
+    * The backend ratelimiter now supports per-method, per-device
+      ratelimits. See `etc/backend-ratelimit.conf-sample
+      `__
+      for more information.
+
+    * The account quota middleware now supports object-count quotas
+      in addition to byte-count quotas, similar to the container
+      quota middleware. For more information, see `the documentation
+      `__.
+
+  - |
+    Object expiration improvements:
+
+    * Added per-account and per-container reaping delays. These may be
+      used to offer some grace period in which to recover expired objects.
+
+    * Added a proxy-server configuration option: ``allow_open_expired``.
+      This defaults to false; if true, clients may interact with expired
+      objects by including an ``X-Open-Expired: true`` header in GET, HEAD,
+      or POST requests.
+
+    * Expiring object queue entries now include the size of the object to
+      be expired in the ``swift_expirer_bytes`` parameter of the queue entry's
+      content-type.
+
+    * Added metrics to count skipped, delayed, and assigned tasks as
+      they're enumerated.
+
+  - |
+    S3 API error response reasons are now logged as part of the ``log_info``
+    field. This can be especially useful when diagnosing HEAD
+    failures, which necessarily have no response body.
+
+  - |
+    Python 3.12 is now supported.
+
+  - |
+    ``swift-account-info`` now supports the ``--sync`` option to display the
+    contents of the incoming and outgoing sync tables, similar to
+    ``swift-container-info``.
+
+  - |
+    The ``swift-drive-audit`` tool now works with ISO timestamps in kernel
+    logs.
+
+upgrade:
+  - |
+    Dependency update: lxml must be at least 4.2.3.
+
+deprecations:
+  - |
+    Overall account byte quotas should now be set with the
+    ``X-Account-Quota-Bytes`` header. The ``X-Account-Meta-Quota-Bytes``
+    header is now deprecated.
+
+fixes:
+  - |
+    S3 API fixes:
+
+    * Fixed a server error when using non-ASCII access key IDs.
+
+    * Fixed several checksum-related error responses to be more AWS-like.
+
+  - |
+    Using an ``X-Remove-Account-Quota-Bytes-Policy-`` header
+    now removes the per-policy quota, rather than reducing it to zero.
+
+  - |
+    Proxy-server fixes:
+
+    * Object POSTs now 503 rather than trusting the 404s that might be
+      returned from handoffs when primaries are overloaded.
+
+    * Client disconnects should always be logged within the context of
+      the appropriate client request. Previously, there were some cases
+      where logging would occur during general garbage collection, leading
+      to incorrect or missing transaction IDs in logs.
+
+    * The proxy-logging middleware now emits timing and transfer stats for
+      more requests such as auth requests. These will be labeled ``UNKNOWN``
+      rather than ``account``, ``container``, etc.
+
+    * Fixed a server error when the Swift request path has missing account
+      or container components.
+
+  - |
+    ``EUCLEAN`` errors are better handled on the object server.
+
+  - |
+    The ``swift-recon-cron`` tool now better handles missing directories.
+
+  - |
+    Various other minor bug fixes and improvements.
diff --git a/releasenotes/notes/release-2.35.0-bb2736e6cbc4a520.yaml b/releasenotes/notes/release-2.35.0-bb2736e6cbc4a520.yaml
new file mode 100644
index 0000000000..96ea5da750
--- /dev/null
+++ b/releasenotes/notes/release-2.35.0-bb2736e6cbc4a520.yaml
@@ -0,0 +1,109 @@
+---
+features:
+  - |
+    Account listings now include storage policy information for the
+    containers listed.
+
+  - |
+    Added a new object-expirer configuration option,
+    ``round_robin_task_cache_size``, to adjust the number of tasks to cache
+    before processing. This may be used to trade faster expirer start-up for
+    more lumpy container-server load.
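+
+    For example (value is illustrative; the option is assumed to live in
+    the usual ``[object-expirer]`` section)::
+
+        [object-expirer]
+        # number of expiration tasks to cache before processing begins
+        round_robin_task_cache_size = 100000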
+
+  - |
+    Added a ``stale_worker_timeout`` configuration option to the WSGI
+    servers. Once this time elapses following a reload, the manager
+    process will issue SIGKILLs to any remaining stale workers.
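+
+    A minimal sketch (both the value and the ``[DEFAULT]`` placement are
+    assumptions; see the WSGI server sample configs)::
+
+        [DEFAULT]
+        # SIGKILL any stale workers this many seconds after a reload
+        stale_worker_timeout = 86400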
+
+  - |
+    Object updater observability improvements:
+
+    * Added last start time to recon dumps as ``object_updater_last``.
+
+    * Added information (including target account/container) from oldest
+      failed updates to recon dumps, both per-device and aggregated for the
+      node. Use the new ``async_tracker_max_entries`` and
+      ``async_tracker_dump_count`` options to adjust how many records to
+      collect.
+
+  - |
+    Added the option to tune down ETag validation in the object-server
+    during full-object reads. By default, every full read will continue
+    to have its ETag validated as bytes are streamed to the proxy-server.
+    The ``etag_validate_pct`` option may be used to configure approximately
+    what percentage of full-object reads should be validated; reducing this
+    can improve performance when object-servers are CPU-constrained.
+
+    Partial reads continue to never have their ETag validated in the
+    object-server. The object-auditor continues to periodically validate
+    every object's ETag.
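+
+    For example, to validate roughly one in ten full-object reads (the
+    ``[app:object-server]`` placement is an assumption)::
+
+        [app:object-server]
+        etag_validate_pct = 10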
+
+deprecations:
+  - |
+    The object-expirer configuration options
+    ``expiring_objects_container_divisor`` and
+    ``expiring_objects_account_name`` are now deprecated.
+
+    If a cluster was deployed with a non-standard account name, operators
+    should remove the option from all configs so they are using a supported
+    configuration going forward, but will need to deploy stand-alone expirer
+    processes with legacy expirer config to clean up old expiration tasks
+    from the previously configured account name.
+
+fixes:
+  - |
+    Removed the use of ``eval`` in the xprofile middleware. Note that this
+    middleware is only intended for development purposes and is not
+    intended for use in production systems.
+
+  - |
+    The S3 API no longer requires a ``Content-MD5`` header for ``DeleteObjects``
+    requests when using v4 signatures.
+
+  - |
+    Uploads to containers with object versioning enabled now require a
+    ``Content-Length`` or ``Transfer-Encoding: chunked`` header, similar to
+    other containers.
+
+  - |
+    Fixed a server error when deleting a specific version via the S3 API.
+
+  - |
+    ``X-Open-Expired`` now works properly with ``?part-number`` requests.
+
+  - |
+    Fixed ``Content-Type`` and ``Content-Length`` headers in account and
+    container ``HEAD`` responses (with eventlet>=0.38.0).
+
+  - |
+    Object expiration fixes:
+
+    * The object-expirer now better handles errors during listings.
+
+    * The object-expirer now respects the ``internal_client_conf_path``
+      configuration option in legacy ``object-expirer.conf`` configs.
+
+  - |
+    Improved the reliability of ``swift-reload``.
+
+  - |
+    Separated unlinks-due-to-outdated-updates from
+    unlinks-due-to-fully-processed-updates in logged object-updater stats.
+
+  - |
+    The ``cooperative_period`` option for the object-server now affects PUT
+    requests in a way similar to GET responses.
+
+  - |
+    Fixed an issue with the object-reconstructor that would prevent
+    reconstruction of objects with non-ASCII header names.
+
+  - |
+    Fixed an issue with the container-reconciler that could cause reconciler
+    databases to have conflicting rows that could not be resolved.
+
+  - |
+    Removed use of the deprecated cgi module.
+
+  - |
+    Various other minor bug fixes and improvements.
diff --git a/releasenotes/notes/release-2.36.0-9f4b539db40bffd7.yaml b/releasenotes/notes/release-2.36.0-9f4b539db40bffd7.yaml
new file mode 100644
index 0000000000..16eb603e2f
--- /dev/null
+++ b/releasenotes/notes/release-2.36.0-9f4b539db40bffd7.yaml
@@ -0,0 +1,88 @@
+---
+features:
+  - |
+    S3 API
+
+    * Added support for aws-chunked transfers. Recent AWS clients
+      default to this mode. See also:
+      `Transferring Payload in Multiple Chunks (Chunked Upload)
+      `__.
+
+    * Added support for verifying additional checksums during upload. All
+      algorithms currently supported by AWS are supported: CRC64NVME,
+      CRC32, CRC32C, SHA1, and SHA256. See also: `Checking object integrity
+      in Amazon S3
+      `__.
+      Note that some algorithms require the availability of additional
+      libraries: ISA-L or anycrc.
+
+    * Added support for create-without-overwrite conditional writes.
+
+  - |
+    Let clients request heartbeats during COPYs by including
+    the query parameter ``heartbeat=on``.
+
+    With heartbeating turned on, the proxy will start its response
+    immediately with 202 Accepted then send a single whitespace
+    character periodically until the request completes. At that
+    point, a final summary chunk will be sent which includes a
+    ``Response Status`` key indicating success or failure.
+
+  - |
+    Labeled metrics
+
+    * Added support for emitting labeled statsd metrics in a variety of
+      formats. Middleware authors should see `the LabeledStatsdClient documentation
+      `__
+      for more information.
+
+    * Instrumented proxy-logging with labeled metrics. See
+      ``proxy-server.conf-sample`` for more information.
+
+    * Instrumented the object-server with labeled metrics. See
+      ``object-server.conf-sample`` for more information.
+
+  - |
+    Added ``access_user_id`` logging field; out-of-tree auth middlewares should
+    use ``environ['swift.access_logging']['user_id']`` to populate this field.
+
+  - |
+    Introduced an extensible ring format. This allows both more than 65,536
+    devices and more data structures to be in a ring. For more information,
+    see `Ring File Formats -- Ring v2
+    `__.
+
+  - |
+    Python 3.13 (with the GIL enabled) is now supported. Free-threaded
+    builds remain untested.
+upgrade:
+  - |
+    Removed support for Python 3.6.
+
+  - |
+    Removed support for pickled ring files. These have not been written
+    since Swift 1.7.0.
+deprecations:
+  - |
+    Flamingo (2025.2) will be the final stable release to support Python 3.7 and 3.8.
+fixes:
+  - |
+    S3 API
+
+    * Fixed HTTP framing issues when returning errors for a request with
+      ``Expect: 100-continue``.
+
+    * Improved various error messages to better imitate AWS responses.
+
+  - |
+    SSYNC connections are now promptly terminated when subrequests timeout.
+
+  - |
+    Fixed a recursion error in the account-quota middleware.
+
+  - |
+    Fixed an error in ``invalidate_hash`` when the partition is deleted while
+    waiting for the partition lock.
+
+  - |
+    Various other minor bug fixes and improvements.
diff --git a/releasenotes/notes/release-2.37.0-7a89cc30f85f03e0.yaml b/releasenotes/notes/release-2.37.0-7a89cc30f85f03e0.yaml
new file mode 100644
index 0000000000..bb729ad43f
--- /dev/null
+++ b/releasenotes/notes/release-2.37.0-7a89cc30f85f03e0.yaml
@@ -0,0 +1,102 @@
+---
+features:
+  - |
+    The s3token middleware now passes service auth tokens to Keystone
+    if credentials are provided. This is required to enable S3 API
+    access for Keystone users when using Keystone >25.0.0, !=26.0.0,
+    !=26.0.1, !=27.0.0, !=28.0.0. See etc/proxy-server.conf-sample for
+    configuration details. For more information, see
+    `OSSA-2025-002 `__ and
+    `bug #2119646 `__.
+
+  - |
+    The s3token middleware now caches credential secrets for one minute
+    by default, if credentials are provided. Secret-caching typically
+    reduces the load on Keystone and is required for Keystone users to
+    be able to use signed aws-chunked transfers. To return to prior
+    behavior, explicitly set ``secret_cache_duration = 0`` in the
+    ``[filter:s3api]`` section of your proxy-server.conf.
+
+  - |
+    The KMS keymaster now supports selecting the endpoint returned in the
+    Keystone catalog via the ``barbican_region_name`` configuration option.
+    This may be useful in multi-region deployments which have multiple
+    endpoints.
+
+  - |
+    The request line-length limit is now configurable for all WSGI servers
+    via the ``max_request_line`` option in the ``[swift-constraints]`` section
+    of swift.conf. By default, continue to use eventlet's default of 8192
+    bytes.
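+
+    For example, to double the limit::
+
+        [swift-constraints]
+        max_request_line = 16384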
+
+  - |
+    The following new metrics were added when using labeled metrics:
+
+      * The proxy-logging middleware may now emit real-time transfer metrics.
+        See the ``statsd_emit_buffer_xfer_bytes_seconds`` option in
+        etc/proxy-server.conf-sample for more information.
+
+      * The proxy-logging middleware now includes an ``api`` label whose value
+        may be ``swift`` or ``S3`` depending on whether the client request is
+        serviced by the swift API or S3 API.
+
+      * The s3api middleware now emits a counter recording the usage of
+        various protocol-related headers.
+
+      * The container-sharder now emits a timing metric for the length of
+        time between shard range creation and cleaving.
+
+  - |
+    ``swift-manage-shard-ranges`` now defaults to committing pending
+    updates before looking for shard range boundaries. A new option,
+    ``--skip-commits``, may be used to restore previous behavior.
+
+  - |
+    Added a ``--clobber-hardlink-collisions`` option to
+    ``swift-object-relinker``. With this option enabled, during the relink
+    phase the relinker will quarantine the colliding file in the new target
+    part dir and retry the relink. During the cleanup phase, it will ignore
+    the unmatched inode "collision" and allow the cleanup of the old file
+    in the old part dir, similar to tombstones.
+
+upgrade:
+  - |
+    Removed fallback support using netifaces; ``getifaddrs`` is now always
+    used to determine available IP addresses.
+
+fixes:
+  - |
+    Improved checksum validation for S3 API DeleteObjects requests.
+
+  - |
+    POST requests are more likely to receive a 503 response in the
+    face of backend inconsistencies.
+
+  - |
+    Writes to sharded containers are less likely to have their updates
+    sent to the root container. This uses a new cooperative-token
+    mechanism to limit the number of concurrent shard range queries
+    to the root container; see the ``[app:proxy-server]`` section of
+    etc/proxy-server.conf-sample for configuration options.
+
+  - |
+    Fixed the ``swift_dir`` option for WSGI servers; the file
+    ``/etc/swift/swift.conf`` no longer needs to exist when that option
+    is set.
+
+  - |
+    Fixed an object-server error when there is a part-power increase in
+    progress and there was an issue marking the file in the new partition
+    space as durable.
+
+  - |
+    Device names are now included in sharded database IDs, similar to
+    regular databases. This provides more context when examining
+    incoming/outgoing sync tables or sharding CleaveContexts.
+
+  - |
+    Database replicators now clean up temporary files older than
+    ``reclaim_age``.
+
+  - |
+    Various other minor bug fixes and improvements.
diff --git a/releasenotes/source/2023.1.rst b/releasenotes/source/2023.1.rst
new file mode 100644
index 0000000000..2c9a36fae4
--- /dev/null
+++ b/releasenotes/source/2023.1.rst
@@ -0,0 +1,6 @@
+===========================
+2023.1 Series Release Notes
+===========================
+
+.. release-notes::
+   :branch: unmaintained/2023.1
diff --git a/releasenotes/source/2023.2.rst b/releasenotes/source/2023.2.rst
new file mode 100644
index 0000000000..a4838d7d0e
--- /dev/null
+++ b/releasenotes/source/2023.2.rst
@@ -0,0 +1,6 @@
+===========================
+2023.2 Series Release Notes
+===========================
+
+.. release-notes::
+   :branch: stable/2023.2
diff --git a/releasenotes/source/2024.1.rst b/releasenotes/source/2024.1.rst
new file mode 100644
index 0000000000..6896656be6
--- /dev/null
+++ b/releasenotes/source/2024.1.rst
@@ -0,0 +1,6 @@
+===========================
+2024.1 Series Release Notes
+===========================
+
+.. release-notes::
+   :branch: unmaintained/2024.1
diff --git a/releasenotes/source/2024.2.rst b/releasenotes/source/2024.2.rst
new file mode 100644
index 0000000000..aaebcbc8c3
--- /dev/null
+++ b/releasenotes/source/2024.2.rst
@@ -0,0 +1,6 @@
+===========================
+2024.2 Series Release Notes
+===========================
+
+.. release-notes::
+   :branch: stable/2024.2
diff --git a/releasenotes/source/2025.1.rst b/releasenotes/source/2025.1.rst
new file mode 100644
index 0000000000..3add0e53aa
--- /dev/null
+++ b/releasenotes/source/2025.1.rst
@@ -0,0 +1,6 @@
+===========================
+2025.1 Series Release Notes
+===========================
+
+.. release-notes::
+   :branch: stable/2025.1
diff --git a/releasenotes/source/2025.2.rst b/releasenotes/source/2025.2.rst
new file mode 100644
index 0000000000..4dae18d869
--- /dev/null
+++ b/releasenotes/source/2025.2.rst
@@ -0,0 +1,6 @@
+===========================
+2025.2 Series Release Notes
+===========================
+
+.. release-notes::
+   :branch: stable/2025.2
diff --git a/releasenotes/source/conf.py b/releasenotes/source/conf.py
new file mode 100644
index 0000000000..401a53ab98
--- /dev/null
+++ b/releasenotes/source/conf.py
@@ -0,0 +1,353 @@
+# -*- coding: utf-8 -*-
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+# implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+# swift documentation build configuration file, created by
+# sphinx-quickstart on Mon Oct  3 17:01:55 2016.
+#
+# This file is execfile()d with the current directory set to its
+# containing dir.
+#
+# Note that not all possible configuration values are present in this
+# autogenerated file.
+#
+# All configuration values have a default; values that are commented out
+# serve to show the default.
+
+# If extensions (or modules to document with autodoc) are in another directory,
+# add these directories to sys.path here. If the directory is relative to the
+# documentation root, use os.path.abspath to make it absolute, like shown here.
+#
+# import os
+# import sys
+# sys.path.insert(0, os.path.abspath('.'))
+
+import datetime
+
+# -- General configuration ------------------------------------------------
+
+# If your documentation needs a minimal Sphinx version, state it here.
+#
+# needs_sphinx = '1.0'
+
+# Add any Sphinx extension module names here, as strings. They can be
+# extensions coming with Sphinx (named 'sphinx.ext.*') or your custom
+# ones.
+extensions = [
+    'reno.sphinxext',
+    'openstackdocstheme',
+]
+
+# Add any paths that contain templates here, relative to this directory.
+# templates_path = ['_templates']
+
+# The suffix(es) of source filenames.
+# You can specify multiple suffix as a list of string:
+#
+# source_suffix = ['.rst', '.md']
+source_suffix = '.rst'
+
+# The encoding of source files.
+#
+# source_encoding = 'utf-8-sig'
+
+# The master toctree document.
+master_doc = 'index'
+
+# General information about the project.
+project = 'Swift Release Notes'
+copyright = '%d, OpenStack Foundation' % datetime.datetime.now().year
+
+# Release notes do not need a version number in the title, they
+# cover multiple releases.
+# The short X.Y version.
+version = ''
+# The full version, including alpha/beta/rc tags.
+release = ''
+
+# The language for content autogenerated by Sphinx. Refer to documentation
+# for a list of supported languages.
+#
+# This is also used if you do content translation via gettext catalogs.
+# Usually you set "language" from the command line for these cases.
+# language = None
+
+# There are two options for replacing |today|: either, you set today to some
+# non-false value, then it is used:
+#
+# today = ''
+#
+# Else, today_fmt is used as the format for a strftime call.
+#
+# today_fmt = '%B %d, %Y'
+
+# List of patterns, relative to source directory, that match files and
+# directories to ignore when looking for source files.
+# This patterns also effect to html_static_path and html_extra_path
+exclude_patterns = ['_build', 'Thumbs.db', '.DS_Store']
+
+# The reST default role (used for this markup: `text`) to use for all
+# documents.
+#
+# default_role = None
+
+# If true, '()' will be appended to :func: etc. cross-reference text.
+#
+# add_function_parentheses = True
+
+# If true, the current module name will be prepended to all description
+# unit titles (such as .. function::).
+#
+# add_module_names = True
+
+# If true, sectionauthor and moduleauthor directives will be shown in the
+# output. They are ignored by default.
+#
+# show_authors = False
+
+# The name of the Pygments (syntax highlighting) style to use.
+pygments_style = 'native'
+
+# A list of ignored prefixes for module index sorting.
+# modindex_common_prefix = []
+
+# If true, keep warnings as "system message" paragraphs in the built documents.
+# keep_warnings = False
+
+# If true, `todo` and `todoList` produce output, else they produce nothing.
+# todo_include_todos = False
+
+
+# -- Options for HTML output ----------------------------------------------
+
+# The theme to use for HTML and HTML Help pages.  See the documentation for
+# a list of builtin themes.
+html_theme = 'openstackdocs'
+
+# Theme options are theme-specific and customize the look and feel of a theme
+# further.  For a list of options available for each theme, see the
+# documentation.
+#
+# html_theme_options = {}
+
+# Add any paths that contain custom themes here, relative to this directory.
+# html_theme_path = []
+
+# The name for this set of Sphinx documents.
+# "<project> v<release> documentation" by default.
+#
+# html_title = u'swift v2.10.0'
+
+# A shorter title for the navigation bar.  Default is the same as html_title.
+#
+# html_short_title = None
+
+# The name of an image file (relative to this directory) to place at the top
+# of the sidebar.
+#
+# html_logo = None
+
+# The name of an image file (relative to this directory) to use as a favicon of
+# the docs.  This file should be a Windows icon file (.ico) being 16x16 or
+# 32x32 pixels large.
+#
+# html_favicon = None
+
+# Add any paths that contain custom static files (such as style sheets) here,
+# relative to this directory. They are copied after the builtin static files,
+# so a file named "default.css" will overwrite the builtin "default.css".
+# html_static_path = ['_static']
+
+# Add any extra paths that contain custom files (such as robots.txt or
+# .htaccess) here, relative to this directory. These files are copied
+# directly to the root of the documentation.
+#
+# html_extra_path = []
+
+# If true, SmartyPants will be used to convert quotes and dashes to
+# typographically correct entities.
+#
+# html_use_smartypants = True
+
+# Custom sidebar templates, maps document names to template names.
+#
+# html_sidebars = {}
+
+# Additional templates that should be rendered to pages, maps page names to
+# template names.
+#
+# html_additional_pages = {}
+
+# If false, no module index is generated.
+#
+# html_domain_indices = True
+
+# If false, no index is generated.
+#
+# html_use_index = True
+
+# If true, the index is split into individual pages for each letter.
+#
+# html_split_index = False
+
+# If true, links to the reST sources are added to the pages.
+#
+# html_show_sourcelink = True
+
+# If true, "Created using Sphinx" is shown in the HTML footer. Default is True.
+#
+# html_show_sphinx = True
+
+# If true, "(C) Copyright ..." is shown in the HTML footer. Default is True.
+#
+# html_show_copyright = True
+
+# If true, an OpenSearch description file will be output, and all pages will
+# contain a <link> tag referring to it.  The value of this option must be the
+# base URL from which the finished HTML is served.
+#
+# html_use_opensearch = ''
+
+# This is the file name suffix for HTML files (e.g. ".xhtml").
+# html_file_suffix = None
+
+# Language to be used for generating the HTML full-text search index.
+# Sphinx supports the following languages:
+#   'da', 'de', 'en', 'es', 'fi', 'fr', 'hu', 'it', 'ja'
+#   'nl', 'no', 'pt', 'ro', 'ru', 'sv', 'tr', 'zh'
+#
+# html_search_language = 'en'
+
+# A dictionary with options for the search language support, empty by default.
+# 'ja' uses this config value.
+# 'zh' user can custom change `jieba` dictionary path.
+#
+# html_search_options = {'type': 'default'}
+
+# The name of a javascript file (relative to the configuration directory) that
+# implements a search results scorer. If empty, the default will be used.
+#
+# html_search_scorer = 'scorer.js'
+
+# Output file base name for HTML help builder.
+htmlhelp_basename = 'SwiftReleaseNotesdoc'
+
+# -- Options for LaTeX output ---------------------------------------------
+
+# latex_elements = {
+#      # The paper size ('letterpaper' or 'a4paper').
+#      #
+#      # 'papersize': 'letterpaper',
+
+#      # The font size ('10pt', '11pt' or '12pt').
+#      #
+#      # 'pointsize': '10pt',
+
+#      # Additional stuff for the LaTeX preamble.
+#      #
+#      # 'preamble': '',
+
+#      # Latex figure (float) alignment
+#      #
+#      # 'figure_align': 'htbp',
+# }
+
+# Grouping the document tree into LaTeX files. List of tuples
+# (source start file, target name, title,
+#  author, documentclass [howto, manual, or own class]).
+# latex_documents = [
+#     (master_doc, 'swift.tex', u'swift Documentation',
+#      u'swift', 'manual'),
+# ]
+
+# The name of an image file (relative to this directory) to place at the top of
+# the title page.
+#
+# latex_logo = None
+
+# For "manual" documents, if this is true, then toplevel headings are parts,
+# not chapters.
+#
+# latex_use_parts = False
+
+# If true, show page references after internal links.
+#
+# latex_show_pagerefs = False
+
+# If true, show URL addresses after external links.
+#
+# latex_show_urls = False
+
+# Documents to append as an appendix to all manuals.
+#
+# latex_appendices = []
+
+# If false, will not define \strong, \code, \titleref, \crossref ... but only
+# \sphinxstrong, ..., \sphinxtitleref, ... To help avoid clash with user added
+# packages.
+#
+# latex_keep_old_macro_names = True
+
+# If false, no module index is generated.
+#
+# latex_domain_indices = True
+
+
+# -- Options for manual page output ---------------------------------------
+
+# One entry per manual page. List of tuples
+# (source start file, name, description, authors, manual section).
+# man_pages = [
+#     (master_doc, 'swift', u'swift Documentation',
+#      [author], 1)
+# ]
+
+# If true, show URL addresses after external links.
+#
+# man_show_urls = False
+
+
+# -- Options for Texinfo output -------------------------------------------
+
+# Grouping the document tree into Texinfo files. List of tuples
+# (source start file, target name, title, author,
+#  dir menu entry, description, category)
+# texinfo_documents = [
+#     (master_doc, 'swift', u'swift Documentation',
+#      author, 'swift', 'One line description of project.',
+#      'Miscellaneous'),
+# ]
+
+# Documents to append as an appendix to all manuals.
+#
+# texinfo_appendices = []
+
+# If false, no module index is generated.
+#
+# texinfo_domain_indices = True
+
+# How to display URL addresses: 'footnote', 'no', or 'inline'.
+#
+# texinfo_show_urls = 'footnote'
+
+# If true, do not generate a @detailmenu in the "Top" node's menu.
+#
+# texinfo_no_detailmenu = False
+
+locale_dirs = ['locale/']
+
+# -- Options for openstackdocstheme -------------------------------------------
+openstackdocs_repo_name = 'openstack/swift'
+openstackdocs_auto_name = False
+openstackdocs_bug_project = 'swift'
+openstackdocs_bug_tag = ''
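+
+# Build note (illustrative only, not part of this change; the output path is
+# an assumption): with the reno and openstackdocstheme extensions configured
+# above, these notes are typically rendered with a plain Sphinx invocation
+# along the lines of:
+#
+#   sphinx-build -W -b html releasenotes/source releasenotes/build/html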
diff --git a/releasenotes/source/current.rst b/releasenotes/source/current.rst
new file mode 100644
index 0000000000..87a748f242
--- /dev/null
+++ b/releasenotes/source/current.rst
@@ -0,0 +1,5 @@
+====================================
+ Current (Unreleased) Release Notes
+====================================
+
+.. release-notes::
diff --git a/releasenotes/source/index.rst b/releasenotes/source/index.rst
new file mode 100644
index 0000000000..823ce4a5fe
--- /dev/null
+++ b/releasenotes/source/index.rst
@@ -0,0 +1,27 @@
+=====================
+ Swift Release Notes
+=====================
+
+.. toctree::
+   :maxdepth: 1
+
+   current
+   2025.2
+   2025.1
+   2024.2
+   2024.1
+   2023.2
+   2023.1
+   zed
+   yoga
+   xena
+   wallaby
+   victoria
+   ussuri
+   train
+   stein
+   rocky
+   queens
+   pike
+   ocata
+   newton
diff --git a/releasenotes/source/locale/en_GB/LC_MESSAGES/releasenotes.po b/releasenotes/source/locale/en_GB/LC_MESSAGES/releasenotes.po
new file mode 100644
index 0000000000..1cb7513bad
--- /dev/null
+++ b/releasenotes/source/locale/en_GB/LC_MESSAGES/releasenotes.po
@@ -0,0 +1,4207 @@
+# Andi Chandler , 2017. #zanata
+# Andi Chandler , 2018. #zanata
+# Andi Chandler , 2020. #zanata
+# Andi Chandler , 2022. #zanata
+# Andi Chandler , 2023. #zanata
+# Andi Chandler , 2024. #zanata
+msgid ""
+msgstr ""
+"Project-Id-Version: Swift Release Notes\n"
+"Report-Msgid-Bugs-To: \n"
+"POT-Creation-Date: 2025-07-07 19:19+0000\n"
+"MIME-Version: 1.0\n"
+"Content-Type: text/plain; charset=UTF-8\n"
+"Content-Transfer-Encoding: 8bit\n"
+"PO-Revision-Date: 2024-10-01 01:42+0000\n"
+"Last-Translator: Andi Chandler \n"
+"Language-Team: English (United Kingdom)\n"
+"Language: en_GB\n"
+"X-Generator: Zanata 4.3.3\n"
+"Plural-Forms: nplurals=2; plural=(n != 1)\n"
+
+msgid ""
+"**Dependency update**: ``eventlet`` must be at least 0.25.0. This also "
+"dragged forward minimum-supported versions of ``dnspython`` (1.15.0), "
+"``greenlet`` (0.3.2), and ``six`` (1.10.0)."
+msgstr ""
+"**Dependency update**: ``eventlet`` must be at least 0.25.0. This also "
+"dragged forward minimum-supported versions of ``dnspython`` (1.15.0), "
+"``greenlet`` (0.3.2), and ``six`` (1.10.0)."
+
+msgid ""
+"**Dependency updates**: we've increased our minimum supported version of "
+"``cryptography`` to 2.0.2 and ``netifaces`` to 0.8. This is largely due to "
+"the difficulty of continuing to test with the old versions."
+msgstr ""
+"**Dependency updates**: we've increased our minimum supported version of "
+"``cryptography`` to 2.0.2 and ``netifaces`` to 0.8. This is largely due to "
+"the difficulty of continuing to test with the old versions."
+
+msgid ""
+"**If your cluster has encryption enabled and is still running Swift under "
+"Python 2**, we recommend upgrading Swift *before* transitioning to Python 3. "
+"Otherwise, new writes to objects with non-ASCII characters in their paths "
+"may result in corrupted downloads when read from a proxy-server still "
+"running old swift on Python 2. See `bug 1888037 `__ for more information."
+msgstr ""
+"**If your cluster has encryption enabled and is still running Swift under "
+"Python 2**, we recommend upgrading Swift *before* transitioning to Python 3. "
+"Otherwise, new writes to objects with non-ASCII characters in their paths "
+"may result in corrupted downloads when read from a proxy-server still "
+"running old swift on Python 2. See `bug 1888037 `__ for more information."
+
+msgid ""
+"**If your cluster has encryption enabled and is still running Swift under "
+"Python 2**, we recommend upgrading Swift *before* transitioning to Python 3. "
+"Otherwise, new writes to objects with non-ASCII characters in their paths "
+"may result in corrupted downloads when read from a proxy-server still "
+"running old swift on Python 2. See `bug 1888037 `__ for more information. Note that new tags including a "
+"fix for the bug are planned for all maintained stable branches; upgrading to "
+"any one of those should be sufficient to ensure a smooth upgrade to the "
+"latest Swift."
+msgstr ""
+"**If your cluster has encryption enabled and is still running Swift under "
+"Python 2**, we recommend upgrading Swift *before* transitioning to Python 3. "
+"Otherwise, new writes to objects with non-ASCII characters in their paths "
+"may result in corrupted downloads when read from a proxy-server still "
+"running old swift on Python 2. See `bug 1888037 `__ for more information. Note that new tags including a "
+"fix for the bug are planned for all maintained stable branches; upgrading to "
+"any one of those should be sufficient to ensure a smooth upgrade to the "
+"latest Swift."
+
+msgid ""
+"**If your cluster is configured with a separate replication network**, note "
+"that background daemons will switch to using this network for all traffic. "
+"If your account, container, or object replication servers are configured "
+"with ``replication_server = true``, these daemons may log a flood of ``405 "
+"Method Not Allowed`` messages during a rolling upgrade. To avoid this, "
+"comment out the option and restart replication servers before upgrading."
+msgstr ""
+"**If your cluster is configured with a separate replication network**, note "
+"that background daemons will switch to using this network for all traffic. "
+"If your account, container, or object replication servers are configured "
+"with ``replication_server = true``, these daemons may log a flood of ``405 "
+"Method Not Allowed`` messages during a rolling upgrade. To avoid this, "
+"comment out the option and restart replication servers before upgrading."
+
+msgid "0 for success"
+msgstr "0 for success"
+
+msgid "1 for an unexpected outcome"
+msgstr "1 for an unexpected outcome"
+
+msgid "2 for invalid options"
+msgstr "2 for invalid options"
+
+msgid "2.10.0"
+msgstr "2.10.0"
+
+msgid "2.10.1"
+msgstr "2.10.1"
+
+msgid "2.10.2"
+msgstr "2.10.2"
+
+msgid "2.11.0"
+msgstr "2.11.0"
+
+msgid "2.12.0"
+msgstr "2.12.0"
+
+msgid "2.13.0"
+msgstr "2.13.0"
+
+msgid "2.13.1"
+msgstr "2.13.1"
+
+msgid "2.13.1-12"
+msgstr "2.13.1-12"
+
+msgid "2.14.0"
+msgstr "2.14.0"
+
+msgid "2.15.0"
+msgstr "2.15.0"
+
+msgid "2.15.1"
+msgstr "2.15.1"
+
+msgid "2.15.2"
+msgstr "2.15.2"
+
+msgid "2.16.0"
+msgstr "2.16.0"
+
+msgid "2.17.0"
+msgstr "2.17.0"
+
+msgid "2.17.1"
+msgstr "2.17.1"
+
+msgid "2.18.0"
+msgstr "2.18.0"
+
+msgid "2.19.0"
+msgstr "2.19.0"
+
+msgid "2.19.1"
+msgstr "2.19.1"
+
+msgid "2.19.2"
+msgstr "2.19.2"
+
+msgid "2.20.0"
+msgstr "2.20.0"
+
+msgid "2.21.0"
+msgstr "2.21.0"
+
+msgid "2.21.1"
+msgstr "2.21.1"
+
+msgid "2.22.0"
+msgstr "2.22.0"
+
+msgid "2.23.0"
+msgstr "2.23.0"
+
+msgid "2.23.1"
+msgstr "2.23.1"
+
+msgid "2.23.2"
+msgstr "2.23.2"
+
+msgid "2.23.3"
+msgstr "2.23.3"
+
+msgid "2.24.0"
+msgstr "2.24.0"
+
+msgid "2.25.0"
+msgstr "2.25.0"
+
+msgid "2.25.1"
+msgstr "2.25.1"
+
+msgid "2.26.0"
+msgstr "2.26.0"
+
+msgid "2.27.0"
+msgstr "2.27.0"
+
+msgid "2.28.0"
+msgstr "2.28.0"
+
+msgid "2.28.1"
+msgstr "2.28.1"
+
+msgid "2.29.1"
+msgstr "2.29.1"
+
+msgid "2.29.2"
+msgstr "2.29.2"
+
+msgid "2.30.0"
+msgstr "2.30.0"
+
+msgid "2.30.1"
+msgstr "2.30.1"
+
+msgid "2.31.1"
+msgstr "2.31.1"
+
+msgid "2.32.0"
+msgstr "2.32.0"
+
+msgid "2.33.0"
+msgstr "2.33.0"
+
+msgid "2.34.0"
+msgstr "2.34.0"
+
+msgid "2023.1 Series Release Notes"
+msgstr "2023.1 Series Release Notes"
+
+msgid "2023.2 Series Release Notes"
+msgstr "2023.2 Series Release Notes"
+
+msgid "2024.1 Series Release Notes"
+msgstr "2024.1 Series Release Notes"
+
+msgid "3 for user exit"
+msgstr "3 for user exit"
+
+msgid ""
+"A 'compact' command has been added to ``swift-manage-shard-ranges`` that "
+"enables sequences of contiguous shards with low object counts to be "
+"compacted into another existing shard, or into the root container."
+msgstr ""
+"A 'compact' command has been added to ``swift-manage-shard-ranges`` that "
+"enables sequences of contiguous shards with low object counts to be "
+"compacted into another existing shard, or into the root container."
+
+msgid ""
+"A PUT or POST to a container will now update the container's Last-Modified "
+"time, and that value will be included in a GET/HEAD response."
+msgstr ""
+"A PUT or POST to a container will now update the container's Last-Modified "
+"time, and that value will be included in a GET/HEAD response."
+
+msgid ""
+"A ``--no-auto-shard`` option has been added to ``swift-container-sharder``."
+msgstr ""
+"A ``--no-auto-shard`` option has been added to ``swift-container-sharder``."
+
+msgid ""
+"A comparable group, ``.reseller_reader``, is now available for development "
+"purposes when authenticating using tempauth."
+msgstr ""
+"A comparable group, ``.reseller_reader``, is now available for development "
+"purposes when authenticating using tempauth."
+
+msgid ""
+"A composite ring comprises two or more component rings that are combined to "
+"form a single ring with a replica count equal to the sum of the component "
+"rings. The component rings are built independently, using distinct devices "
+"in distinct regions, which means that the dispersion of replicas between the "
+"components can be guaranteed."
+msgstr ""
+"A composite ring comprises two or more component rings that are combined to "
+"form a single ring with a replica count equal to the sum of the component "
+"rings. The component rings are built independently, using distinct devices "
+"in distinct regions, which means that the dispersion of replicas between the "
+"components can be guaranteed."
+
+msgid ""
+"A new ``item_size_warning_threshold`` option may be used to monitor for "
+"values that are approaching the limit of what can be stored in memcache. See "
+"the memcache sample config for more information."
+msgstr ""
+"A new ``item_size_warning_threshold`` option may be used to monitor for "
+"values that are approaching the limit of what can be stored in memcache. See "
+"the memcache sample config for more information."
+
+msgid ""
+"A variety of performance improvements have been made for sharded container "
+"databases."
+msgstr ""
+"A variety of performance improvements have been made for sharded container "
+"databases."
+
+msgid "ACLs now work with unicode in user/account names."
+msgstr "ACLs now work with Unicode in user/account names."
+
+msgid ""
+"Accept a trade off of dispersion for balance in the ring builder that will "
+"result in getting to balanced rings much more quickly in some cases."
+msgstr ""
+"Accept a trade off of dispersion for balance in the ring builder that will "
+"result in getting to balanced rings much more quickly in some cases."
+
+msgid ""
+"Account and container databases will now be quarantined if the database "
+"schema has been corrupted."
+msgstr ""
+"Account and container databases will now be quarantined if the database "
+"schema has been corrupted."
+
+msgid ""
+"Account and container info metrics now include the response status code when "
+"backend requests are made."
+msgstr ""
+"Account and container info metrics now include the response status code when "
+"backend requests are made."
+
+msgid ""
+"Account and container replication stats logs now include ``remote_merges``, "
+"the number of times a whole database was sent to another node."
+msgstr ""
+"Account and container replication stats logs now include ``remote_merges``, "
+"the number of times a whole database was sent to another node."
+
+msgid ""
+"Account and container replicators can now be configured with a "
+"``handoff_delete`` option, similar to object replicators and reconstructors. "
+"See the sample config for more information."
+msgstr ""
+"Account and container replicators can now be configured with a "
+"``handoff_delete`` option, similar to object replicators and reconstructors. "
+"See the sample config for more information."
+
+msgid "Account quotas are now enforced even on empty accounts."
+msgstr "Account quotas are now enforced even on empty accounts."
+
+msgid ""
+"Account, container, and object log fields are now correctly identified when "
+"returning ``BadDigest`` responses to S3 requests."
+msgstr ""
+"Account, container, and object log fields are now correctly identified when "
+"returning ``BadDigest`` responses to S3 requests."
+
+msgid "Add Composite Ring Functionality"
+msgstr "Add Composite Ring Functionality"
+
+msgid "Add Vary headers for CORS responses."
+msgstr "Add Vary headers for CORS responses."
+
+msgid ""
+"Add ``databases_per_second`` to the account-replicator, container-"
+"replicator, and container-sharder. This prevents them from using a full CPU "
+"core when they are not IO limited."
+msgstr ""
+"Add ``databases_per_second`` to the account-replicator, container-"
+"replicator, and container-sharder. This prevents them from using a full CPU "
+"core when they are not IO limited."
+
+msgid ""
+"Add a ``--drop-prefixes`` flag to swift-account-info, swift-container-info, "
+"and swift-object-info. This makes the output between the three more "
+"consistent."
+msgstr ""
+"Add a ``--drop-prefixes`` flag to swift-account-info, swift-container-info, "
+"and swift-object-info. This makes the output between the three more "
+"consistent."
+
+msgid ""
+"Add a multiprocess mode to the object replicator. Setting the "
+"``replicator_workers`` setting to a positive value N will result in the "
+"replicator using up to N worker processes to perform replication tasks. At "
+"most one worker per disk will be spawned."
+msgstr ""
+"Add a multiprocess mode to the object replicator. Setting the "
+"``replicator_workers`` setting to a positive value N will result in the "
+"replicator using up to N worker processes to perform replication tasks. At "
+"most one worker per disk will be spawned."
+
+msgid ""
+"Add a new ``concurrent_ec_extra_requests`` option to allow the proxy to make "
+"some extra backend requests immediately. The proxy will respond as soon as "
+"there are enough responses available to reconstruct."
+msgstr ""
+"Add a new ``concurrent_ec_extra_requests`` option to allow the proxy to make "
+"some extra backend requests immediately. The proxy will respond as soon as "
+"there are enough responses available to reconstruct."
+
+msgid ""
+"Add basic read support for S3 object locking. This improves compatibility "
+"with an Ansible S3 module. Write support is not yet implemented, so get-"
+"object-lock-configuration will always 404."
+msgstr ""
+"Add basic read support for S3 object locking. This improves compatibility "
+"with an Ansible S3 module. Write support is not yet implemented, so get-"
+"object-lock-configuration will always 404."
+
+msgid ""
+"Add basic read support for object tagging. This improves compatibility with "
+"AWS CLI version 2. Write support is not yet implemented, so the tag set will "
+"always be empty."
+msgstr ""
+"Add basic read support for object tagging. This improves compatibility with "
+"AWS CLI version 2. Write support is not yet implemented, so the tag set will "
+"always be empty."
+
+msgid ""
+"Add basic support for ?versions bucket listings. We still do not have "
+"support for toggling S3 bucket versioning, but we can at least support "
+"getting the latest versions of all objects."
+msgstr ""
+"Add basic support for ?versions bucket listings. We still do not have "
+"support for toggling S3 bucket versioning, but we can at least support "
+"getting the latest versions of all objects."
+
+msgid "Add checksum to object extended attributes."
+msgstr "Add checksum to object extended attributes."
+
+msgid ""
+"Add fallocate_reserve to account and container servers. This allows disks "
+"shared between account/container and object rings to avoid getting 100% "
+"full. The default value of 1% matches the existing default on object servers."
+msgstr ""
+"Add fallocate_reserve to account and container servers. This allows disks "
+"shared between account/container and object rings to avoid getting 100% "
+"full. The default value of 1% matches the existing default on object servers."
+
+msgid "Add root containers with compactible ranges to recon cache."
+msgstr "Add root containers with compatible ranges to recon cache."
+
+msgid ""
+"Add slo_manifest_hook callback to allow other middlewares to impose "
+"additional constraints on or make edits to SLO manifests before being "
+"written. For example, a middleware could enforce minimum segment size or "
+"insert data segments."
+msgstr ""
+"Add slo_manifest_hook callback to allow other middlewares to impose "
+"additional constraints on or make edits to SLO manifests before being "
+"written. For example, a middleware could enforce minimum segment size or "
+"insert data segments."
+
+msgid ""
+"Add support for PROXY protocol v1 to the proxy server. This allows the Swift "
+"proxy server to log accurate client IP addresses when there is a proxy or "
+"SSL-terminator between the client and the Swift proxy server.  Example "
+"servers supporting this PROXY protocol include stunnel, haproxy, hitch, and "
+"varnish. See the sample proxy server config file for the appropriate config "
+"setting to enable or disable this functionality."
+msgstr ""
+"Add support for PROXY protocol v1 to the proxy server. This allows the Swift "
+"proxy server to log accurate client IP addresses when there is a proxy or "
+"SSL-terminator between the client and the Swift proxy server.  Example "
+"servers supporting this PROXY protocol include stunnel, HAProxy, hitch, and "
+"Varnish. See the sample proxy server config file for the appropriate config "
+"setting to enable or disable this functionality."
+
+msgid ""
+"Add support for multiple root encryption secrets for the trivial and KMIP "
+"keymasters. This allows operators to rotate encryption keys over time "
+"without needing to re-encrypt all existing data in the cluster. Please see "
+"the included sample config files for instructions on how to multiple "
+"encryption keys."
+msgstr ""
+"Add support for multiple root encryption secrets for the trivial and KMIP "
+"keymasters. This allows operators to rotate encryption keys over time "
+"without needing to re-encrypt all existing data in the cluster. Please see "
+"the included sample config files for instructions on how to multiple "
+"encryption keys."
+
+msgid ""
+"Add support to increase object ring partition power transparently to end "
+"users and with no cluster downtime. Increasing the ring part power allows "
+"for incremental adjustment to the upper bound of the cluster size. Please "
+"review the `full docs `__ for more information."
+msgstr ""
+"Add support to increase object ring partition power transparently to end "
+"users and with no cluster downtime. Increasing the ring part power allows "
+"for incremental adjustment to the upper bound of the cluster size. Please "
+"review the `full docs `__ for more information."
+
+msgid ""
+"Added \"audit watcher\" hooks to allow operators to run arbitrary code "
+"against every diskfile in a cluster. For more information, see `the "
+"documentation `__."
+msgstr ""
+"Added \"audit watcher\" hooks to allow operators to run arbitrary code "
+"against every diskfile in a cluster. For more information, see `the "
+"documentation `__."
+
+msgid ""
+"Added \"emergency mode\" hooks in the account and container replicators. "
+"These options may be used to prioritize moving handoff partitions to primary "
+"locations more quickly. This helps when adding capacity to a ring."
+msgstr ""
+"Added \"emergency mode\" hooks in the account and container replicators. "
+"These options may be used to prioritise moving handoff partitions to primary "
+"locations more quickly. This helps when adding capacity to a ring."
+
+msgid ""
+"Added \"static symlinks\", which perform some validation as they follow "
+"redirects and include more information about their target in container "
+"listings. For more information, see the `symlink middleware `__ section of the "
+"documentation."
+msgstr ""
+"Added \"static symlinks\", which perform some validation as they follow "
+"redirects and include more information about their target in container "
+"listings. For more information, see the `symlink middleware `__ section of the "
+"documentation."
+
+msgid ""
+"Added ``--swift-versions`` to ``swift-recon`` CLI to compare installed "
+"versions in the cluster."
+msgstr ""
+"Added ``--swift-versions`` to ``swift-recon`` CLI to compare installed "
+"versions in the cluster."
+
+msgid "Added ``-d `` and ``-p `` command line options."
+msgstr "Added ``-d `` and ``-p `` command line options."
+
+msgid ""
+"Added ``Accept-Ranges: bytes`` to object responses. Range requests have "
+"always been supported; now, that support is properly advertised."
+msgstr ""
+"Added ``Accept-Ranges: bytes`` to object responses. Range requests have "
+"always been supported; now, that support is properly advertised."
+
+msgid "Added ``tasks_per_second`` option to rate-limit the object-expirer."
+msgstr "Added ``tasks_per_second`` option to rate-limit the object-expirer."
+
+msgid ""
+"Added ``ttfb`` (Time to First Byte) and ``pid`` (Process ID) to the set of "
+"available proxy-server log fields. For more information, see `the "
+"documentation `__."
+msgstr ""
+"Added ``ttfb`` (Time to First Byte) and ``pid`` (Process ID) to the set of "
+"available proxy-server log fields. For more information, see `the "
+"documentation `__."
+
+msgid ""
+"Added ``usedforsecurity`` annotations for use on FIPS-compliant systems."
+msgstr ""
+"Added ``usedforsecurity`` annotations for use on FIPS-compliant systems."
+
+msgid ""
+"Added a \"user\" option to the drive-audit config file. Its value is used to "
+"set the owner of the drive-audit recon cache."
+msgstr ""
+"Added a \"user\" option to the drive-audit config file. Its value is used to "
+"set the owner of the drive-audit recon cache."
+
+msgid "Added a ``--dry-run`` option for the 'compact' command."
+msgstr "Added a ``--dry-run`` option for the 'compact' command."
+
+msgid ""
+"Added a ``--includes`` option for the 'show' command to only output shard "
+"ranges that may include a given object name."
+msgstr ""
+"Added a ``--includes`` option for the 'show' command to only output shard "
+"ranges that may include a given object name."
+
+msgid ""
+"Added a ``keep_cache_slo_manifest`` option to the object server to better "
+"control whether SLO manifests are dropped from the page cache."
+msgstr ""
+"Added a ``keep_cache_slo_manifest`` option to the object server to better "
+"control whether SLO manifests are dropped from the page cache."
+
+msgid ""
+"Added a ``keep_idle`` config option to configure KEEPIDLE time for TCP "
+"sockets. The default value is the old constant of 600."
+msgstr ""
+"Added a ``keep_idle`` config option to configure KEEPIDLE time for TCP "
+"sockets. The default value is the old constant of 600."
+
+msgid ""
+"Added a ``keepalive_timeout`` option to the proxy server to limit how long "
+"to wait for a client to initiate a request, separate from the general "
+"``client_timeout`` option. Note that this requires eventlet 0.33.4 "
+"(currently unreleased) or later."
+msgstr ""
+"Added a ``keepalive_timeout`` option to the proxy server to limit how long "
+"to wait for a client to initiate a request, separate from the general "
+"``client_timeout`` option. Note that this requires eventlet 0.33.4 "
+"(currently unreleased) or later."
+
+msgid ""
+"Added a ``log_rsync_transfers`` option to the object-replicator. Set it to "
+"false to disable logging rsync \"send\" lines; during large rebalances, such "
+"logging can overwhelm log aggregation while providing little useful "
+"information."
+msgstr ""
+"Added a ``log_rsync_transfers`` option to the object-replicator. Set it to "
+"false to disable logging rsync \"send\" lines; during large rebalances, such "
+"logging can overwhelm log aggregation while providing little useful "
+"information."
+
+msgid ""
+"Added a ``ring_ip`` option for various object services. This may be used to "
+"find own devices in the ring in a containerized environment where the "
+"``bind_ip`` may not appear in the ring at all."
+msgstr ""
+"Added a ``ring_ip`` option for various object services. This may be used to "
+"find own devices in the ring in a containerised environment where the "
+"``bind_ip`` may not appear in the ring at all."
+
+msgid ""
+"Added a ``swift-reload`` command to assist with safely reloading WSGI "
+"servers."
+msgstr ""
+"Added a ``swift-reload`` command to assist with safely reloading WSGI "
+"servers."
+
+msgid ""
+"Added a configurable URL base to staticweb, fixing issues when the "
+"accessible endpoint isn't known to the Swift cluster (eg http vs https)."
+msgstr ""
+"Added a configurable URL base to staticweb, fixing issues when the "
+"accessible endpoint isn't known to the Swift cluster (eg http vs https)."
+
+msgid "Added a configurable URL base to staticweb."
+msgstr "Added a configurable URL base to staticweb."
+
+msgid "Added a counter metric to the proxy server when caching shard ranges."
+msgstr "Added a counter metric to the proxy server when caching shard ranges."
+
+msgid ""
+"Added a delay before deleting non-durable data. A new configuration option, "
+"``commit_window`` in the ``[DEFAULT]`` section of object-server.conf, "
+"adjusts this delay; the default is 60 seconds. This improves the durability "
+"of both back-dated PUTs (from the reconciler or container-sync, for example) "
+"and fresh writes to handoffs by preventing the reconstructor from deleting "
+"data that the object-server was still writing."
+msgstr ""
+"Added a delay before deleting non-durable data. A new configuration option, "
+"``commit_window`` in the ``[DEFAULT]`` section of object-server.conf, "
+"adjusts this delay; the default is 60 seconds. This improves the durability "
+"of both back-dated PUTs (from the reconciler or container-sync, for example) "
+"and fresh writes to handoffs by preventing the reconstructor from deleting "
+"data that the object-server was still writing."
+
+msgid "Added a handoffs-only mode."
+msgstr "Added a handoffs-only mode."
+
+msgid ""
+"Added a new 'analyze' command to automatically identify overlapping shard "
+"ranges and recommend a resolution based on a JSON listing of shard ranges "
+"such as produced by the 'show' command."
+msgstr ""
+"Added a new 'analyze' command to automatically identify overlapping shard "
+"ranges and recommend a resolution based on a JSON listing of shard ranges "
+"such as produced by the 'show' command."
+
+msgid ""
+"Added a new 'repair' command to automatically identify and optionally "
+"resolve overlapping shard ranges."
+msgstr ""
+"Added a new 'repair' command to automatically identify and optionally "
+"resolve overlapping shard ranges."
+
+msgid ""
+"Added a new ``swift.proxy_logging_status`` request environment key that "
+"middlewares may use to override the logged status for a request."
+msgstr ""
+"Added a new ``swift.proxy_logging_status`` request environment key that "
+"middlewares may use to override the logged status for a request."
+
+msgid ""
+"Added a new config option, ``minimum_shard_size``. When scanning for shard "
+"ranges, if the final shard would otherwise contain fewer than this many "
+"objects, the previous shard will instead be expanded to the end of the "
+"namespace (and so may contain up to ``rows_per_shard + minimum_shard_size`` "
+"objects). This reduces the number of small shards generated. The default "
+"value is ``rows_per_shard / 5``."
+msgstr ""
+"Added a new config option, ``minimum_shard_size``. When scanning for shard "
+"ranges, if the final shard would otherwise contain fewer than this many "
+"objects, the previous shard will instead be expanded to the end of the "
+"namespace (and so may contain up to ``rows_per_shard + minimum_shard_size`` "
+"objects). This reduces the number of small shards generated. The default "
+"value is ``rows_per_shard / 5``."
+
+msgid ""
+"Added a new config option, ``rows_per_shard``, to specify how many objects "
+"should be in each shard when scanning for ranges. The default is "
+"``shard_container_threshold / 2``, preserving existing behavior."
+msgstr ""
+"Added a new config option, ``rows_per_shard``, to specify how many objects "
+"should be in each shard when scanning for ranges. The default is "
+"``shard_container_threshold / 2``, preserving existing behaviour."
+
+msgid ""
+"Added a new config option, ``shrink_threshold``, to specify the absolute "
+"size below which a shard will be considered for shrinking. This overrides "
+"the ``shard_shrink_point`` configuration option, which expressed this as a "
+"percentage of ``shard_container_threshold``. ``shard_shrink_point`` is now "
+"deprecated."
+msgstr ""
+"Added a new config option, ``shrink_threshold``, to specify the absolute "
+"size below which a shard will be considered for shrinking. This overrides "
+"the ``shard_shrink_point`` configuration option, which expressed this as a "
+"percentage of ``shard_container_threshold``. ``shard_shrink_point`` is now "
+"deprecated."
+
+msgid ""
+"Added a new middleware that allows users and operators to configure accounts "
+"and containers to use RFC-compliant (i.e., double-quoted) ETags. This may be "
+"useful when using Swift as an origin for some content delivery networks. For "
+"more information, see `the middleware documentation `__."
+msgstr ""
+"Added a new middleware that allows users and operators to configure accounts "
+"and containers to use RFC-compliant (i.e., double-quoted) ETags. This may be "
+"useful when using Swift as an origin for some content delivery networks. For "
+"more information, see `the middleware documentation `__."
+
+msgid ""
+"Added a new middleware to allow accounts and containers to opt-in to RFC-"
+"compliant ETags. For more information, see `the documentation `__. Clients should be aware of the fact that ETags may be "
+"quoted for RFC compliance; this may become the default behavior in some "
+"future release."
+msgstr ""
+"Added a new middleware to allow accounts and containers to opt-in to RFC-"
+"compliant ETags. For more information, see `the documentation `__. Clients should be aware of the fact that ETags may be "
+"quoted for RFC compliance; this may become the default behaviour in some "
+"future release."
+
+msgid ""
+"Added a new object versioning mode, with APIs for querying and accessing old "
+"versions. For more information, see `the documentation `__."
+msgstr ""
+"Added a new object versioning mode, with APIs for querying and accessing old "
+"versions. For more information, see `the documentation `__."
+
+msgid ""
+"Added a new optional proxy-logging field ``{wire_status_int}`` for the "
+"status code returned to the client. For more information, see `the "
+"documentation `__."
+msgstr ""
+"Added a new optional proxy-logging field ``{wire_status_int}`` for the "
+"status code returned to the client. For more information, see `the "
+"documentation `__."
+
+msgid ""
+"Added a proxy-server configuration option: ``allow_open_expired``. This "
+"defaults to false; if true, clients may intereact with expired objects by "
+"including an ``X-Open-Expired: true`` header in GET, HEAD, or POST requests."
+msgstr ""
+"Added a proxy-server configuration option: ``allow_open_expired``. This "
+"defaults to false; if true, clients may interact with expired objects by "
+"including an ``X-Open-Expired: true`` header in GET, HEAD, or POST requests."
+
+msgid ""
+"Added an experimental ``swift-ring-composer`` CLI tool to build composite "
+"rings."
+msgstr ""
+"Added an experimental ``swift-ring-composer`` CLI tool to build composite "
+"rings."
+
+msgid ""
+"Added an operator tool, ``swift-container-deleter``, to asynchronously "
+"delete some or all objects in a container using the object expirers."
+msgstr ""
+"Added an operator tool, ``swift-container-deleter``, to asynchronously "
+"delete some or all objects in a container using the object expirers."
+
+msgid "Added an option to drop privileges when running the relinker as root."
+msgstr "Added an option to drop privileges when running the relinker as root."
+
+msgid ""
+"Added an option to rate-limit how quickly data files are relinked or cleaned "
+"up. This may be used to reduce I/O load during partition power increases, "
+"improving end-user performance."
+msgstr ""
+"Added an option to rate-limit how quickly data files are relinked or cleaned "
+"up. This may be used to reduce I/O load during partition power increases, "
+"improving end-user performance."
+
+msgid ""
+"Added an option to write EC fragments with legacy CRC to ensure a smooth "
+"upgrade from liberasurecode<=1.5.0 to >=1.6.2. For more information, see "
+"`bug 1886088 `__."
+msgstr ""
+"Added an option to write EC fragments with legacy CRC to ensure a smooth "
+"upgrade from liberasurecode<=1.5.0 to >=1.6.2. For more information, see "
+"`bug 1886088 `__."
+
+msgid ""
+"Added an option, ``ratelimit_as_client_error``, to return 429s for rate-"
+"limited responses. Several clients/SDKs have seem to support retries with "
+"backoffs on 429, and having it as a client error cleans up logging and "
+"metrics. By default, Swift will respond 503, matching AWS documentation."
+msgstr ""
+"Added an option, ``ratelimit_as_client_error``, to return 429s for rate-"
+"limited responses. Several clients/SDKs have seem to support retries with "
+"backoffs on 429, and having it as a client error cleans up logging and "
+"metrics. By default, Swift will respond 503, matching AWS documentation."
+
+msgid ""
+"Added an optional ``read_only`` middleware to make an entire cluster or "
+"individual accounts read only."
+msgstr ""
+"Added an optional ``read_only`` middleware to make an entire cluster or "
+"individual accounts read only."
+
+msgid ""
+"Added container sharding, an operator controlled feature that may be used to "
+"shard very large container databases into a number of smaller shard "
+"containers. This mitigates the issues with one large DB by distributing the "
+"data across multiple smaller databases throughout the cluster. Please read "
+"the full overview at https://docs.openstack.org/swift/latest/"
+"overview_container_sharding.html"
+msgstr ""
+"Added container sharding, an operator controlled feature that may be used to "
+"shard very large container databases into a number of smaller shard "
+"containers. This mitigates the issues with one large DB by distributing the "
+"data across multiple smaller databases throughout the cluster. Please read "
+"the full overview at https://docs.openstack.org/swift/latest/"
+"overview_container_sharding.html"
+
+msgid "Added container/object listing with prefix to InternalClient."
+msgstr "Added container/object listing with prefix to InternalClient."
+
+msgid ""
+"Added metrics to count skipped, delayed, and assigned tasks as they're "
+"enumerated."
+msgstr ""
+"Added metrics to count skipped, delayed, and assigned tasks as they're "
+"enumerated."
+
+msgid ""
+"Added metrics to the formpost and tempurl middlewares to monitor digest "
+"usage in signatures."
+msgstr ""
+"Added metrics to the formpost and tempurl middlewares to monitor digest "
+"usage in signatures."
+
+msgid ""
+"Added more metrics to the container-server, allowing GET and PUT timings to "
+"be broken out for listings, shard range operations, and container creation."
+msgstr ""
+"Added more metrics to the container-server, allowing GET and PUT timings to "
+"be broken out for listings, shard range operations, and container creation."
+
+msgid ""
+"Added per-account and per-container reaping delays. These may be used to "
+"offer some grace period in which to recover expired objects."
+msgstr ""
+"Added per-account and per-container reaping delays. These may be used to "
+"offer some grace period in which to recover expired objects."
+
+msgid "Added support for Python 3.8."
+msgstr "Added support for Python 3.8."
+
+msgid "Added support for Python 3.9."
+msgstr "Added support for Python 3.9."
+
+msgid "Added support for S3 versioning using the above new mode."
+msgstr "Added support for S3 versioning using the above new mode."
+
+msgid "Added support for inline data segments in SLO manifests."
+msgstr "Added support for inline data segments in SLO manifests."
+
+msgid ""
+"Added support for per-policy proxy config options. This allows per-policy "
+"affinity options to be set for use with duplicated EC policies and composite "
+"rings. Certain options found in per-policy conf sections will override their "
+"equivalents that may be set in the [app:proxy-server] section. Currently the "
+"options handled that way are ``sorting_method``, ``read_affinity``, "
+"``write_affinity``, ``write_affinity_node_count``, and "
+"``write_affinity_handoff_delete_count``."
+msgstr ""
+"Added support for per-policy proxy config options. This allows per-policy "
+"affinity options to be set for use with duplicated EC policies and composite "
+"rings. Certain options found in per-policy conf sections will override their "
+"equivalents that may be set in the [app:proxy-server] section. Currently the "
+"options handled that way are ``sorting_method``, ``read_affinity``, "
+"``write_affinity``, ``write_affinity_node_count``, and "
+"``write_affinity_handoff_delete_count``."
+
+msgid "Added support for recent versions of eventlet."
+msgstr "Added support for recent versions of eventlet."
+
+msgid ""
+"Added support for retrieving the encryption root secret from an external key "
+"management system. In practice, this is currently limited to Barbican."
+msgstr ""
+"Added support for retrieving the encryption root secret from an external key "
+"management system. In practice, this is currently limited to Barbican."
+
+msgid ""
+"Added support for system-scoped \"reader\" roles when authenticating using "
+"Keystone. Operators may configure this using the ``system_reader_roles`` "
+"option in the ``[filter:keystoneauth]`` section of their proxy-server.conf."
+msgstr ""
+"Added support for system-scoped \"reader\" roles when authenticating using "
+"Keystone. Operators may configure this using the ``system_reader_roles`` "
+"option in the ``[filter:keystoneauth]`` section of their proxy-server.conf."
+
+msgid "Added symlink objects support."
+msgstr "Added symlink objects support."
+
+msgid ""
+"Added the ability for reseller admins to set per-policy account quotas by "
+"posting metadata of the form ``X-Account-Quota-Bytes-Policy-``."
+msgstr ""
+"Added the ability for reseller admins to set per-policy account quotas by "
+"posting metadata of the form ``X-Account-Quota-Bytes-Policy-``."
+
+msgid "Added the ability to configure auth region in s3token middleware."
+msgstr "Added the ability to configure auth region in s3token middleware."
+
+msgid ""
+"Added the ability to connect to memcached over TLS. See the ``tls_*`` "
+"options in etc/memcache.conf-sample"
+msgstr ""
+"Added the ability to connect to Memcached over TLS. See the ``tls_*`` "
+"options in etc/memcache.conf-sample"
+
+msgid ""
+"Added the ability to read options from object-server.conf, similar to "
+"background daemons."
+msgstr ""
+"Added the ability to read options from object-server.conf, similar to "
+"background daemons."
+
+msgid "After upgrading, re-enable and restart the object-reconstructor."
+msgstr "After upgrading, re-enable and restart the object-reconstructor."
+
+msgid ""
+"All 416 responses will now include a Content-Range header with an "
+"unsatisfied-range value. This allows the caller to know the valid range "
+"request value for an object."
+msgstr ""
+"All 416 responses will now include a Content-Range header with an "
+"unsatisfied-range value. This allows the caller to know the valid range "
+"request value for an object."
+
+msgid ""
+"All background daemons now use the replication network. This allows better "
+"isolation between external, client-facing traffic and internal, background "
+"traffic. Note that during a rolling upgrade, replication servers may respond "
+"with ``405 Method Not Allowed``. To avoid this, operators should remove the "
+"config option ``replication_server = true`` from their replication servers; "
+"this will allow them to handle all request methods before upgrading."
+msgstr ""
+"All background daemons now use the replication network. This allows better "
+"isolation between external, client-facing traffic and internal, background "
+"traffic. Note that during a rolling upgrade, replication servers may respond "
+"with ``405 Method Not Allowed``. To avoid this, operators should remove the "
+"config option ``replication_server = true`` from their replication servers; "
+"this will allow them to handle all request methods before upgrading."
+
+msgid "Allow ``fallocate_reserve`` to be specified as a percentage."
+msgstr "Allow ``fallocate_reserve`` to be specified as a percentage."
+
+msgid "Allow direct_client users to overwrite the ``X-Timestamp`` header."
+msgstr "Allow direct_client users to overwrite the ``X-Timestamp`` header."
+
+msgid ""
+"Allow operators to pass either raw or URL-quoted paths to ``swift-get-"
+"nodes``. Notably, this allows ``swift-get-nodes`` to work with the reserved "
+"namespace used for object versioning."
+msgstr ""
+"Allow operators to pass either raw or URL-quoted paths to ``swift-get-"
+"nodes``. Notably, this allows ``swift-get-nodes`` to work with the reserved "
+"namespace used for object versioning."
+
+msgid "Allow proxy-logging middlewares to be configured more independently."
+msgstr "Allow proxy-logging middlewares to be configured more independently."
+
+msgid ""
+"Allow ratelimit to be placed multiple times in a proxy pipeline, such as "
+"both before s3api and auth (to handle swift requests without needing to make "
+"an auth decision) and after (to limit S3 requests)."
+msgstr ""
+"Allow ratelimit to be placed multiple times in a proxy pipeline, such as "
+"both before s3api and auth (to handle swift requests without needing to make "
+"an auth decision) and after (to limit S3 requests)."
+
+msgid ""
+"Allow static large object segments to be deleted asynchronously. Operators "
+"may opt into this new behavior by enabling the new ``allow_async_delete`` "
+"option in the ``[filter:slo]`` section in their proxy-server.conf. For more "
+"information, see `the documentation `__."
+msgstr ""
+"Allow static large object segments to be deleted asynchronously. Operators "
+"may opt into this new behaviour by enabling the new ``allow_async_delete`` "
+"option in the ``[filter:slo]`` section in their proxy-server.conf. For more "
+"information, see `the documentation `__."
+
+msgid "Allow the expirer to gracefully move past updating stale work items."
+msgstr "Allow the expirer to gracefully move past updating stale work items."
+
+msgid "Always set Swift processes to use UTC."
+msgstr "Always set Swift processes to use UTC."
+
+msgid ""
+"As a result, some errors that previously resulted in exit code 2 will now "
+"exit with code 1."
+msgstr ""
+"As a result, some errors that previously resulted in exit code 2 will now "
+"exit with code 1."
+
+msgid ""
+"Avoid upgrading liberasurecode until swift and liberasurecode better-support "
+"a rolling upgrade. Swift remains compatible with liberasurecode 1.5.0 and "
+"earlier."
+msgstr ""
+"Avoid upgrading liberasurecode until swift and liberasurecode better-support "
+"a rolling upgrade. Swift remains compatible with liberasurecode 1.5.0 and "
+"earlier."
+
+msgid "Background corruption-detection improvements"
+msgstr "Background corruption-detection improvements"
+
+msgid "Bug Fixes"
+msgstr "Bug Fixes"
+
+msgid "COPY now works with unicode account names."
+msgstr "COPY now works with Unicode account names."
+
+msgid "Cache all answers from nameservers in cname_lookup."
+msgstr "Cache all answers from nameservers in cname_lookup."
+
+msgid ""
+"Certain S3 API headers are now lower case as they would be coming from AWS."
+msgstr ""
+"Certain S3 API headers are now lower case as they would be coming from AWS."
+
+msgid ""
+"Change the behavior of the EC reconstructor to perform a fragment rebuild to "
+"a handoff node when a primary peer responds with 507 to the REPLICATE "
+"request. This changes EC to match the existing behavior of replication when "
+"drives fail. After a rebalance of EC rings (potentially removing unmounted/"
+"failed devices), it's most IO efficient to run in handoffs_only mode to "
+"avoid unnecessary rebuilds."
+msgstr ""
+"Change the behaviour of the EC reconstructor to perform a fragment rebuild "
+"to a handoff node when a primary peer responds with 507 to the REPLICATE "
+"request. This changes EC to match the existing behaviour of replication when "
+"drives fail. After a rebalance of EC rings (potentially removing unmounted/"
+"failed devices), it's most IO efficient to run in handoffs_only mode to "
+"avoid unnecessary rebuilds."
+
+msgid ""
+"Changed where liberasurecode-devel for CentOS 7 is referenced and installed "
+"as a dependency."
+msgstr ""
+"Changed where liberasurecode-devel for CentOS 7 is referenced and installed "
+"as a dependency."
+
+msgid "Cleaned up logged tracebacks when talking to memcached servers."
+msgstr "Cleaned up logged tracebacks when talking to memcached servers."
+
+msgid ""
+"Closed a bug where ssync may have written bad fragment data in some "
+"circumstances. A check was added to ensure the correct number of bytes is "
+"written for a fragment before finalizing the write. Also, erasure coded "
+"fragment metadata will now be validated on read requests and, if bad data is "
+"found, the fragment will be quarantined."
+msgstr ""
+"Closed a bug where ssync may have written bad fragment data in some "
+"circumstances. A check was added to ensure the correct number of bytes is "
+"written for a fragment before finalising the write. Also, erasure coded "
+"fragment metadata will now be validated on read requests and, if bad data is "
+"found, the fragment will be quarantined."
+
+msgid ""
+"Closed a bug where ssync may have written bad fragment data in some "
+"circumstances. A check was added to ensure the correct number of bytes is "
+"written for a fragment before finalizing the write. Also, erasure coded "
+"fragment metadata will now be validated when read and, if bad data is found, "
+"the fragment will be quarantined."
+msgstr ""
+"Closed a bug where sync may have written bad fragment data in some "
+"circumstances. A check was added to ensure the correct number of bytes is "
+"written for a fragment before finalising the write. Also, erasure coded "
+"fragment metadata will now be validated when read and, if bad data is found, "
+"the fragment will be quarantined."
+
+msgid "CompleteMultipartUpload requests may now be safely retried."
+msgstr "CompleteMultipartUpload requests may now be safely retried."
+
+msgid "CompleteMultipartUpload requests with a ``Content-MD5`` now work."
+msgstr "CompleteMultipartUpload requests with a ``Content-MD5`` now work."
+
+msgid ""
+"Composite rings can be used for explicit replica placement and \"replicated "
+"EC\" for global erasure codes policies."
+msgstr ""
+"Composite rings can be used for explicit replica placement and \"replicated "
+"EC\" for global erasure codes policies."
+
+msgid ""
+"Composite rings support 'cooperative' rebalance which means that during "
+"rebalance all component rings will be consulted before a partition is moved "
+"in any component ring. This avoids the same partition being simultaneously "
+"moved in multiple components."
+msgstr ""
+"Composite rings support 'cooperative' rebalance which means that during "
+"rebalance all component rings will be consulted before a partition is moved "
+"in any component ring. This avoids the same partition being simultaneously "
+"moved in multiple components."
+
+msgid ""
+"Container metadata related to sharding are now removed when no longer needed."
+msgstr ""
+"Container metadata related to sharding are now removed when no longer needed."
+
+msgid ""
+"Container read ACLs now work with object versioning. This only allows access "
+"to the most-recent version via an unversioned URL."
+msgstr ""
+"Container read ACLs now work with object versioning. This only allows access "
+"to the most-recent version via an unversioned URL."
+
+msgid ""
+"Container sync can now copy SLOs more efficiently by allowing the manifest "
+"to be synced before all of the referenced segments. This fixes a bug where "
+"container sync would not copy SLO manifests."
+msgstr ""
+"Container sync can now copy SLOs more efficiently by allowing the manifest "
+"to be synced before all of the referenced segments. This fixes a bug where "
+"container sync would not copy SLO manifests."
+
+msgid ""
+"Container sync now synchronizes static symlinks in a way similar to static "
+"large objects."
+msgstr ""
+"Container sync now synchronizes static symlinks in a way similar to static "
+"large objects."
+
+msgid "Correctly handle deleted files with if-none-match requests."
+msgstr "Correctly handle deleted files with if-none-match requests."
+
+msgid ""
+"Correctly send 412 Precondition Failed if a user sends an invalid copy "
+"destination. Previously Swift would send a 500 Internal Server Error."
+msgstr ""
+"Correctly send 412 Precondition Failed if a user sends an invalid copy "
+"destination. Previously Swift would send a 500 Internal Server Error."
+
+msgid "Correctness improvements"
+msgstr "Correctness improvements"
+
+msgid "Critical Issues"
+msgstr "Critical Issues"
+
+msgid ""
+"Cross-account symlinks now store correct account information in container "
+"listings. This was previously fixed in 2.22.0."
+msgstr ""
+"Cross-account symlinks now store correct account information in container "
+"listings. This was previously fixed in 2.22.0."
+
+msgid "Current (Unreleased) Release Notes"
+msgstr "Current (Unreleased) Release Notes"
+
+msgid ""
+"Currently the default is still only one process, and no workers. Set "
+"``reconstructor_workers`` in the ``[object-reconstructor]`` section to some "
+"whole number <= the number of devices on a node to get that many "
+"reconstructor workers."
+msgstr ""
+"Currently the default is still only one process, and no workers. Set "
+"``reconstructor_workers`` in the ``[object-reconstructor]`` section to some "
+"whole number <= the number of devices on a node to get that many "
+"reconstructor workers."
+
+msgid "Daemons using InternalClient can now be properly killed with SIGTERM."
+msgstr "Daemons using InternalClient can now be properly killed with SIGTERM."
+
+msgid "Data encryption updates"
+msgstr "Data encryption updates"
+
+msgid ""
+"Deleted shard containers are no longer considered root containers. This "
+"prevents unnecessary sharding audit failures and allows the deleted shard "
+"database to actually be unlinked."
+msgstr ""
+"Deleted shard containers are no longer considered root containers. This "
+"prevents unnecessary sharding audit failures and allows the deleted shard "
+"database to actually be unlinked."
+
+msgid ""
+"Deleting an expiring object will now cause less work in the system. The "
+"number of async pending files written has been reduced for all objects and "
+"greatly reduced for erasure-coded objects. This dramatically reduces the "
+"burden on container servers."
+msgstr ""
+"Deleting an expiring object will now cause less work in the system. The "
+"number of async pending files written has been reduced for all objects and "
+"greatly reduced for erasure-coded objects. This dramatically reduces the "
+"burden on container servers."
+
+msgid ""
+"Deployers with clusters that relied on the old implicit default location of "
+"\"US\" should explicitly set ``location = US`` in the ``[filter:s3api]`` "
+"section of proxy-server.conf before upgrading."
+msgstr ""
+"Deployers with clusters that relied on the old implicit default location of "
+"\"US\" should explicitly set ``location = US`` in the ``[filter:s3api]`` "
+"section of proxy-server.conf before upgrading."
+
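+# Illustrative sketch for the entry above, as it might appear in
+# proxy-server.conf (section name and option value are quoted from the note):
+#
+#   [filter:s3api]
+#   location = US
+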
+msgid ""
+"Deprecate swift-temp-url and call python-swiftclient's implementation "
+"instead. This adds python-swiftclient as an optional dependency of Swift."
+msgstr ""
+"Deprecate swift-temp-url and call python-swiftclient's implementation "
+"instead. This adds python-swiftclient as an optional dependency of Swift."
+
+msgid "Deprecation Notes"
+msgstr "Deprecation Notes"
+
+msgid "Detect and remove invalid entries from ``hashes.pkl``"
+msgstr "Detect and remove invalid entries from ``hashes.pkl``"
+
+msgid ""
+"Device region and zone can now be changed via ``swift-ring-builder``. Note "
+"that this may cause a lot of data movement on the next rebalance as the "
+"builder tries to reach full dispersion."
+msgstr ""
+"Device region and zone can now be changed via ``swift-ring-builder``. Note "
+"that this may cause a lot of data movement on the next rebalance as the "
+"builder tries to reach full dispersion."
+
+msgid "Disallow X-Delete-At header values equal to the X-Timestamp header."
+msgstr "Disallow X-Delete-At header values equal to the X-Timestamp header."
+
+msgid "Display crypto data/metadata details in swift-object-info."
+msgstr "Display crypto data/metadata details in swift-object-info."
+
+msgid "Display more info on empty rings."
+msgstr "Display more info on empty rings."
+
+msgid "Do not follow CNAME when host is in storage_domain."
+msgstr "Do not follow CNAME when host is in storage_domain."
+
+msgid "Don't inject shard ranges when user quits."
+msgstr "Don't inject shard ranges when user quits."
+
+msgid "Drop support for auth-server from common/manager.py and `swift-init`."
+msgstr "Drop support for auth-server from common/manager.py and `swift-init`."
+
+msgid ""
+"During rebalances, clients should no longer get 404s for data that exists "
+"but whose replicas are overloaded."
+msgstr ""
+"During rebalances, clients should no longer get 404s for data that exists "
+"but whose replicas are overloaded."
+
+msgid "EC Fragment Duplication - Foundational Global EC Cluster Support."
+msgstr "EC Fragment Duplication - Foundational Global EC Cluster Support."
+
+msgid ""
+"Empty container databases (such as might be created on handoffs) now shard "
+"much more quickly."
+msgstr ""
+"Empty container databases (such as might be created on handoffs) now shard "
+"much more quickly."
+
+msgid ""
+"Enable cluster-wide CORS Expose-Headers setting via \"cors_expose_headers\"."
+msgstr ""
+"Enable cluster-wide CORS Expose-Headers setting via \"cors_expose_headers\"."
+
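+# Illustrative sketch for the entry above (the header names shown are
+# examples; placing the option in the [DEFAULT] section of proxy-server.conf
+# is an assumption):
+#
+#   [DEFAULT]
+#   cors_expose_headers = X-Custom-Header, X-Other-Header
+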
+msgid "Enabled versioned writes on Dynamic Large Objects (DLOs)."
+msgstr "Enabled versioned writes on Dynamic Large Objects (DLOs)."
+
+msgid ""
+"Ensure update of the container by object-updater, removing a rare "
+"possibility that objects would never be added to a container listing."
+msgstr ""
+"Ensure update of the container by object-updater, removing a rare "
+"possibility that objects would never be added to a container listing."
+
+msgid ""
+"Erasure code GET performance has been significantly improved in clusters "
+"that are not completely healthy."
+msgstr ""
+"Erasure code GET performance has been significantly improved in clusters "
+"that are not completely healthy."
+
+msgid ""
+"Erasure code reconstruction handles moving data from handoff nodes better. "
+"Instead of moving the data to another handoff, it waits until it can be "
+"moved to a primary node."
+msgstr ""
+"Erasure code reconstruction handles moving data from hand-off nodes better. "
+"Instead of moving the data to another hand-off, it waits until it can be "
+"moved to a primary node."
+
+msgid ""
+"Erasure-coded storage policies using ``isa_l_rs_vand`` and ``nparity`` >= 5 "
+"must be configured as deprecated, preventing any new containers from being "
+"created with such a policy. This configuration is known to harm data "
+"durability. Any data in such policies should be migrated to a new policy. "
+"See See `Launchpad bug 1639691 `__ for more information."
+msgstr ""
+"Erasure-coded storage policies using ``isa_l_rs_vand`` and ``nparity`` >= 5 "
+"must be configured as deprecated, preventing any new containers from being "
+"created with such a policy. This configuration is known to harm data "
+"durability. Any data in such policies should be migrated to a new policy. "
+"See See `Launchpad bug 1639691 `__ for more information."
+
+msgid ""
+"Errors encountered while validating static symlink targets no longer cause "
+"BadResponseLength errors in the proxy-server."
+msgstr ""
+"Errors encountered while validating static symlink targets no longer cause "
+"BadResponseLength errors in the proxy-server."
+
+msgid ""
+"Errors encountered while validating static symlink targets no longer cause "
+"``BadResponseLength`` errors in the proxy-server."
+msgstr ""
+"Errors encountered while validating static symlink targets no longer cause "
+"``BadResponseLength`` errors in the proxy-server."
+
+msgid ""
+"Experimental support for Python 3.6 and 3.7 is now available. Note that this "
+"requires ``eventlet>=0.25.0``. All unit tests pass, and running functional "
+"tests under Python 2 will pass against services running under Python 3. "
+"Expect full support in the next minor release."
+msgstr ""
+"Experimental support for Python 3.6 and 3.7 is now available. Note that this "
+"requires ``eventlet>=0.25.0``. All unit tests pass, and running functional "
+"tests under Python 2 will pass against services running under Python 3. "
+"Expect full support in the next minor release."
+
+msgid ""
+"Extend concurrent reads to erasure coded policies. Previously, the options "
+"``concurrent_gets`` and ``concurrency_timeout`` only applied to replicated "
+"policies."
+msgstr ""
+"Extend concurrent reads to erasure coded policies. Previously, the options "
+"``concurrent_gets`` and ``concurrency_timeout`` only applied to replicated "
+"policies."
+
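+# Illustrative sketch for the entry above (option names are quoted from the
+# note; the [app:proxy-server] section and the values shown are assumptions):
+#
+#   [app:proxy-server]
+#   concurrent_gets = on
+#   concurrency_timeout = 0.5
+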
+msgid "Fix SLO delete for accounts with non-ASCII names."
+msgstr "Fix SLO delete for accounts with non-ASCII names."
+
+msgid ""
+"Fix a proxy-server error when retrieving erasure coded data when there are "
+"durable fragments but not enough to reconstruct."
+msgstr ""
+"Fix a proxy-server error when retrieving erasure coded data when there are "
+"durable fragments but not enough to reconstruct."
+
+msgid "Fix an error in the proxy server when finalizing data."
+msgstr "Fix an error in the proxy server when finalising data."
+
+msgid ""
+"Fixed 500 from cname_lookup middleware. Previously, if the looked-up domain "
+"was used by domain_remap to update the request path, the server would "
+"respond Internal Error."
+msgstr ""
+"Fixed 500 from cname_lookup middleware. Previously, if the looked-up domain "
+"was used by domain_remap to update the request path, the server would "
+"respond Internal Error."
+
+msgid ""
+"Fixed UnicodeDecodeError in the object reconstructor that would prevent "
+"objects with non-ascii names from being reconstructed and caused the "
+"reconstructor process to hang."
+msgstr ""
+"Fixed UnicodeDecodeError in the object reconstructor that would prevent "
+"objects with non-ASCII names from being reconstructed and caused the "
+"reconstructor process to hang."
+
+msgid ""
+"Fixed XML responses (eg on bulk extractions and SLO upload failures) to be "
+"more correct. The enclosing \"delete\" tag was removed where it doesn't make "
+"sense and replaced with \"extract\" or \"upload\" depending on the context."
+msgstr ""
+"Fixed XML responses (e.g. on bulk extractions and SLO upload failures) to be "
+"more correct. The enclosing \"delete\" tag was removed where it doesn't make "
+"sense and replaced with \"extract\" or \"upload\" depending on the context."
+
+msgid "Fixed ``rsync`` output parsing."
+msgstr "Fixed ``rsync`` output parsing."
+
+msgid "Fixed a bug in domain_remap when obj starts/ends with slash."
+msgstr "Fixed a bug in domain_remap when obj starts/ends with slash."
+
+msgid ""
+"Fixed a bug in how Swift uses eventlet that was exposed under high "
+"concurrency."
+msgstr ""
+"Fixed a bug in how Swift uses eventlet that was exposed under high "
+"concurrency."
+
+msgid ""
+"Fixed a bug in the EC reconstructor where an unsuccessful sync would cause "
+"extra disk I/O load on the remote server. Now the extra checking work is "
+"only requested if the sync request was successful."
+msgstr ""
+"Fixed a bug in the EC reconstructor where an unsuccessful sync would cause "
+"extra disk I/O load on the remote server. Now the extra checking work is "
+"only requested if the sync request was successful."
+
+msgid ""
+"Fixed a bug in the new object versioning API that would cause more than "
+"``limit`` results to be returned when listing."
+msgstr ""
+"Fixed a bug in the new object versioning API that would cause more than "
+"``limit`` results to be returned when listing."
+
+msgid ""
+"Fixed a bug introduced in 2.15.0 where the object reconstructor would exit "
+"with a traceback if no EC policy was configured."
+msgstr ""
+"Fixed a bug introduced in 2.15.0 where the object reconstructor would exit "
+"with a traceback if no EC policy was configured."
+
+msgid "Fixed a bug where SSYNC would fail to replicate unexpired object."
+msgstr "Fixed a bug where SSYNC would fail to replicate unexpired object."
+
+msgid ""
+"Fixed a bug where a container listing delimiter wouldn't work with "
+"encryption."
+msgstr ""
+"Fixed a bug where a container listing delimiter wouldn't work with "
+"encryption."
+
+msgid ""
+"Fixed a bug where an SLO download with a range request may have resulted in "
+"a 5xx series response."
+msgstr ""
+"Fixed a bug where an SLO download with a range request may have resulted in "
+"a 5xx series response."
+
+msgid ""
+"Fixed a bug where encryption would store the incorrect key metadata if the "
+"object name starts with a slash."
+msgstr ""
+"Fixed a bug where encryption would store the incorrect key metadata if the "
+"object name starts with a slash."
+
+msgid ""
+"Fixed a bug where some headers weren't being copied correctly in a COPY "
+"request."
+msgstr ""
+"Fixed a bug where some headers weren't being copied correctly in a COPY "
+"request."
+
+msgid "Fixed a bug where some tombstone files might never be reclaimed."
+msgstr "Fixed a bug where some tombstone files might never be reclaimed."
+
+msgid ""
+"Fixed a bug where the ring builder would not allow removal of a device when "
+"min_part_seconds_left was greater than zero."
+msgstr ""
+"Fixed a bug where the ring builder would not allow removal of a device when "
+"min_part_seconds_left was greater than zero."
+
+msgid ""
+"Fixed a bug where zero-byte PUTs would not work properly with \"If-None-"
+"Match: \\*\" conditional requests."
+msgstr ""
+"Fixed a bug where zero-byte PUTs would not work properly with \"If-None-"
+"Match: \\*\" conditional requests."
+
+msgid ""
+"Fixed a cache invalidation issue related to GET and PUT requests to "
+"containers that would occasionally cause object PUTs to a container to 404 "
+"after the container had been successfully created."
+msgstr ""
+"Fixed a cache invalidation issue related to GET and PUT requests to "
+"containers that would occasionally cause object PUTs to a container to 404 "
+"after the container had been successfully created."
+
+msgid "Fixed a few areas where the ``swiftdir`` option was not respected."
+msgstr "Fixed a few areas where the ``swiftdir`` option was not respected."
+
+msgid ""
+"Fixed a race condition in updating hashes.pkl where a partition suffix "
+"invalidation may have been skipped."
+msgstr ""
+"Fixed a race condition in updating hashes.pkl where a partition suffix "
+"invalidation may have been skipped."
+
+msgid "Fixed a rare infinite loop in `swift-ring-builder` while placing parts."
+msgstr ""
+"Fixed a rare infinite loop in `swift-ring-builder` while placing parts."
+
+msgid ""
+"Fixed a rare issue where multiple backend timeouts could result in bad data "
+"being returned to the client."
+msgstr ""
+"Fixed a rare issue where multiple backend timeouts could result in bad data "
+"being returned to the client."
+
+msgid "Fixed a socket leak in copy middleware when a large object was copied."
+msgstr "Fixed a socket leak in copy middleware when a large object was copied."
+
+msgid ""
+"Fixed an error when reading encrypted data that was written while running "
+"Python 2 for a path that includes non-ASCII characters."
+msgstr ""
+"Fixed an error when reading encrypted data that was written while running "
+"Python 2 for a path that includes non-ASCII characters."
+
+msgid ""
+"Fixed an issue in COPY where concurrent requests may have copied the wrong "
+"data."
+msgstr ""
+"Fixed an issue in COPY where concurrent requests may have copied the wrong "
+"data."
+
+msgid ""
+"Fixed an issue that caused Delete Multiple Objects requests with large "
+"bodies to 400. This was previously fixed in 2.20.0."
+msgstr ""
+"Fixed an issue that caused Delete Multiple Objects requests with large "
+"bodies to 400. This was previously fixed in 2.20.0."
+
+msgid ""
+"Fixed an issue when reading or writing objects with a content-type like "
+"``message/*``. Previously, Swift would fail to respond."
+msgstr ""
+"Fixed an issue when reading or writing objects with a content-type like "
+"``message/*``. Previously, Swift would fail to respond."
+
+msgid ""
+"Fixed an issue where S3 API v4 signatures would not be validated against the "
+"body of the request, allowing a replay attack if request headers were "
+"captured by a malicious third party."
+msgstr ""
+"Fixed an issue where S3 API v4 signatures would not be validated against the "
+"body of the request, allowing a replay attack if request headers were "
+"captured by a malicious third party."
+
+msgid ""
+"Fixed an issue where a failed drive could prevent the container sharder from "
+"making progress."
+msgstr ""
+"Fixed an issue where a failed drive could prevent the container sharder from "
+"making progress."
+
+msgid ""
+"Fixed an issue where an object server failure during a client download could "
+"leave an open socket between the proxy and client."
+msgstr ""
+"Fixed an issue where an object server failure during a client download could "
+"leave an open socket between the proxy and client."
+
+msgid ""
+"Fixed an issue where background consistency daemon child processes would "
+"deadlock waiting on the same file descriptor."
+msgstr ""
+"Fixed an issue where background consistency daemon child processes would "
+"deadlock waiting on the same file descriptor."
+
+msgid ""
+"Fixed an issue where deleted EC objects didn't have their on-disk "
+"directories cleaned up. This would cause extra resource usage on the object "
+"servers."
+msgstr ""
+"Fixed an issue where deleted EC objects didn't have their on-disk "
+"directories cleaned up. This would cause extra resource usage on the object "
+"servers."
+
+msgid ""
+"Fixed an issue where multipart uploads with the S3 API would sometimes "
+"report an error despite all segments being upload successfully."
+msgstr ""
+"Fixed an issue where multipart uploads with the S3 API would sometimes "
+"report an error despite all segments being upload successfully."
+
+msgid ""
+"Fixed an issue where non-ASCII Keystone EC2 credentials would not get mapped "
+"to the correct account. This was previously fixed in 2.20.0."
+msgstr ""
+"Fixed an issue where non-ASCII Keystone EC2 credentials would not get mapped "
+"to the correct account. This was previously fixed in 2.20.0."
+
+msgid ""
+"Fixed an issue where v4 signatures would not be validated against the body "
+"of the request, allowing a replay attack if request headers were captured by "
+"a malicious third party. Note that unsigned payloads still function normally."
+msgstr ""
+"Fixed an issue where v4 signatures would not be validated against the body "
+"of the request, allowing a replay attack if request headers were captured by "
+"a malicious third party. Note that unsigned payloads still function normally."
+
+msgid ""
+"Fixed an issue with SSYNC requests to ensure that only one request can be "
+"running on a partition at a time."
+msgstr ""
+"Fixed an issue with SSYNC requests to ensure that only one request can be "
+"running on a partition at a time."
+
+msgid ""
+"Fixed an issue with multi-region EC policies that caused the EC "
+"reconstructor to constantly attempt cross-region rebuild traffic."
+msgstr ""
+"Fixed an issue with multi-region EC policies that caused the EC "
+"reconstructor to constantly attempt cross-region rebuild traffic."
+
+msgid "Fixed deadlock when logging from a tpool thread."
+msgstr "Fixed deadlock when logging from a tpool thread."
+
+msgid ""
+"Fixed deadlock when logging from a tpool thread. The object server runs "
+"certain IO-intensive methods outside the main pthread for performance. "
+"Previously, if one of those methods tried to log, this can cause a crash "
+"that eventually leads to an object server with hundreds or thousands of "
+"greenthreads, all deadlocked. The fix is to use a mutex that works across "
+"different greenlets and different pthreads."
+msgstr ""
+"Fixed deadlock when logging from a tpool thread. The object server runs "
+"certain IO-intensive methods outside the main pthread for performance. "
+"Previously, if one of those methods tried to log, this can cause a crash "
+"that eventually leads to an object server with hundreds or thousands of "
+"greenthreads, all deadlocked. The fix is to use a mutex that works across "
+"different greenlets and different pthreads."
+
+msgid ""
+"Fixed encoding issue in ssync where a mix of ascii and non-ascii metadata "
+"values would cause an error."
+msgstr ""
+"Fixed encoding issue in ssync where a mix of ASCII and non-ASCII metadata "
+"values would cause an error."
+
+msgid ""
+"Fixed error where a container drive error resulted in double space usage on "
+"rest drives. When drive with container or account database is unmounted, the "
+"bug would create handoff replicas on all remaining drives, increasing the "
+"drive space used and filling the cluster."
+msgstr ""
+"Fixed error where a container drive error resulted in double space usage on "
+"rest drives. When drive with container or account database is unmounted, the "
+"bug would create hand-off replicas on all remaining drives, increasing the "
+"drive space used and filling the cluster."
+
+msgid ""
+"Fixed issue where bulk requests using xml and expect 100-continue would "
+"return a malformed HTTP response."
+msgstr ""
+"Fixed issue where bulk requests using XML and expect 100-continue would "
+"return a malformed HTTP response."
+
+msgid "Fixed listings for sharded containers."
+msgstr "Fixed listings for sharded containers."
+
+msgid "Fixed non-ASCII account metadata handling."
+msgstr "Fixed non-ASCII account metadata handling."
+
+msgid ""
+"Fixed non-deterministic suffix updates in hashes.pkl where a partition may "
+"be updated much less often than expected."
+msgstr ""
+"Fixed non-deterministic suffix updates in hashes.pkl where a partition may "
+"be updated much less often than expected."
+
+msgid "Fixed rare socket leak on range requests to erasure-coded objects."
+msgstr "Fixed rare socket leak on range requests to erasure-coded objects."
+
+msgid ""
+"Fixed regression in consolidate_hashes that occured when a new file was "
+"stored to new suffix to a non-empty partition. This bug was introduced in "
+"2.7.0 and could cause an increase in rsync replication stats during and "
+"after upgrade, due to inconsistent hashing of partition suffixes."
+msgstr ""
+"Fixed regression in consolidate_hashes that occurred when a new file was "
+"stored to new suffix to a non-empty partition. This bug was introduced in "
+"2.7.0 and could cause an increase in rsync replication stats during and "
+"after upgrade, due to inconsistent hashing of partition suffixes."
+
+msgid ""
+"Fixed regression in consolidate_hashes that occurred when a new file was "
+"stored to new suffix to a non-empty partition. This bug was introduced in "
+"2.7.0 and could cause an increase in rsync replication stats during and "
+"after upgrade, due to inconsistent hashing of partition suffixes."
+msgstr ""
+"Fixed regression in consolidate_hashes that occurred when a new file was "
+"stored to new suffix to a non-empty partition. This bug was introduced in "
+"2.7.0 and could cause an increase in rsync replication stats during and "
+"after upgrade, due to inconsistent hashing of partition suffixes."
+
+msgid "Fixed some SignatureDoesNotMatch errors when using the AWS .NET SDK."
+msgstr "Fixed some SignatureDoesNotMatch errors when using the AWS .NET SDK."
+
+msgid "Fixed some minor test compatibility issues."
+msgstr "Fixed some minor test compatibility issues."
+
+msgid "Fixed some title-casing of headers."
+msgstr "Fixed some title-casing of headers."
+
+msgid "Fixed the KeyError message when auditor finds an expired object."
+msgstr "Fixed the KeyError message when auditor finds an expired object."
+
+msgid "Fixed the stats calculation in the erasure code reconstructor."
+msgstr "Fixed the stats calculation in the erasure code reconstructor."
+
+msgid "Fixed time skew when using X-Delete-After."
+msgstr "Fixed time skew when using X-Delete-After."
+
+msgid ""
+"Fixed using ``swift-ring-builder set_weight`` with more than one device."
+msgstr ""
+"Fixed using ``swift-ring-builder set_weight`` with more than one device."
+
+msgid "Fixed v1 listings that end with a non-ASCII object name."
+msgstr "Fixed v1 listings that end with a non-ASCII object name."
+
+msgid ""
+"For further information see the `docs `__"
+msgstr ""
+"For further information see the `docs `__"
+
+msgid ""
+"For new multipart-uploads via the S3 API, the ETag that is stored will be "
+"calculated in the same way that AWS uses. This ETag will be used in GET/HEAD "
+"responses, bucket listings, and conditional requests via the S3 API. "
+"Accessing the same object via the Swift API will use the SLO Etag; however, "
+"in JSON container listings the multipart upload etag will be exposed in a "
+"new \"s3_etag\" key. Previously, some S3 clients would complain about "
+"download corruption when the ETag did not have a '-'."
+msgstr ""
+"For new multipart-uploads via the S3 API, the ETag that is stored will be "
+"calculated in the same way that AWS uses. This ETag will be used in GET/HEAD "
+"responses, bucket listings, and conditional requests via the S3 API. "
+"Accessing the same object via the Swift API will use the SLO Etag; however, "
+"in JSON container listings the multipart upload etag will be exposed in a "
+"new \"s3_etag\" key. Previously, some S3 clients would complain about "
+"download corruption when the ETag did not have a '-'."
+
+msgid "Fractional replicas are no longer allowed for erasure code policies."
+msgstr "Fractional replicas are no longer allowed for erasure code policies."
+
+msgid ""
+"GET and HEAD requests to a symlink will operate on the referenced object and "
+"require appropriate permission in the target container. DELETE and PUT "
+"requests will operate on the symlink object itself. POST requests are not "
+"forwarded to the referenced object. POST requests sent to a symlink will "
+"result in a 307 Temporary Redirect response."
+msgstr ""
+"GET and HEAD requests to a symlink will operate on the referenced object and "
+"require appropriate permission in the target container. DELETE and PUT "
+"requests will operate on the symlink object itself. POST requests are not "
+"forwarded to the referenced object. POST requests sent to a symlink will "
+"result in a 307 Temporary Redirect response."
+
+msgid ""
+"Getting an SLO manifest with ``?format=raw`` now responds with an ETag that "
+"matches the MD5 of the generated body rather than the MD5 of the manifest "
+"stored on disk."
+msgstr ""
+"Getting an SLO manifest with ``?format=raw`` now responds with an ETag that "
+"matches the MD5 of the generated body rather than the MD5 of the manifest "
+"stored on disk."
+
+msgid ""
+"Hashes are no longer invalidated after a successful ssync; they were already "
+"invalidated during the data transfer."
+msgstr ""
+"Hashes are no longer invalidated after a successful ssync; they were already "
+"invalidated during the data transfer."
+
+msgid "I/O priority is now supported on AArch64 architecture."
+msgstr "I/O priority is now supported on AArch64 architecture."
+
+msgid ""
+"If a proxy server is configured to autocreate accounts and the account "
+"create fails, it will now return a server error (500) instead of Not Found "
+"(404)."
+msgstr ""
+"If a proxy server is configured to autocreate accounts and the account "
+"create fails, it will now return a server error (500) instead of Not Found "
+"(404)."
+
+msgid ""
+"If proxy and object layers can be upgraded independently and proxies can be "
+"upgraded quickly:"
+msgstr ""
+"If proxy and object layers can be upgraded independently and proxies can be "
+"upgraded quickly:"
+
+msgid "If running Swift under Python 3, ``eventlet`` must be at least 0.25.0."
+msgstr "If running Swift under Python 3, ``eventlet`` must be at least 0.25.0."
+
+msgid ""
+"If the sharder encounters shard range gaps while cleaving, it will now log "
+"an error and halt sharding progress. Previously, rows may not have been "
+"moved properly, leading to data loss."
+msgstr ""
+"If the sharder encounters shard range gaps while cleaving, it will now log "
+"an error and halt sharding progress. Previously, rows may not have been "
+"moved properly, leading to data loss."
+
+msgid ""
+"If upgrading from Swift 2.20.0 or Swift 2.19.1 or earlier, set "
+"``meta_version_to_write = 1`` in your keymaster configuration *prior* to "
+"upgrading."
+msgstr ""
+"If upgrading from Swift 2.20.0 or Swift 2.19.1 or earlier, set "
+"``meta_version_to_write = 1`` in your keymaster configuration *prior* to "
+"upgrading."
+
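+# Illustrative sketch for the entry above (the option is quoted from the
+# note; the [filter:keymaster] section name in proxy-server.conf is an
+# assumption about where the keymaster is configured):
+#
+#   [filter:keymaster]
+#   meta_version_to_write = 1
+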
+msgid ""
+"If using erasure coding with ISA-L in rs_vand mode and 5 or more parity "
+"fragments, Swift will emit a warning. This is a configuration that is known "
+"to harm data durability. In a future release, this warning will be upgraded "
+"to an error unless the policy is marked as deprecated. All data in an "
+"erasure code storage policy using isa_l_rs_vand with 5 or more parity should "
+"be migrated as soon as possible. Please see https://bugs.launchpad.net/swift/"
+"+bug/1639691 for more information."
+msgstr ""
+"If using erasure coding with ISA-L in rs_vand mode and 5 or more parity "
+"fragments, Swift will emit a warning. This is a configuration that is known "
+"to harm data durability. In a future release, this warning will be upgraded "
+"to an error unless the policy is marked as deprecated. All data in an "
+"erasure code storage policy using isa_l_rs_vand with 5 or more parity should "
+"be migrated as soon as possible. Please see https://bugs.launchpad.net/swift/"
+"+bug/1639691 for more information."
+
+msgid "If you have a config file like this::"
+msgstr "If you have a config file like this::"
+
+msgid "If you upgrade and roll back, you must delete all `hashes.pkl` files."
+msgstr "If you upgrade and roll back, you must delete all `hashes.pkl` files."
+
+msgid "If you want updates to be processed exactly as before, do this::"
+msgstr "If you want updates to be processed exactly as before, do this::"
+
+msgid ""
+"If you've been testing Swift on Python 3, upgrade at your earliest "
+"convenience."
+msgstr ""
+"If you've been testing Swift on Python 3, upgrade at your earliest "
+"convenience."
+
+msgid ""
+"If your users can tolerate it, consider a read-only rolling upgrade. Before "
+"upgrading, enable the `read-only middleware `__ cluster-wide to prevent new "
+"writes during the upgrade. Additionally, stop and disable the object-"
+"reconstructor as above. Upgrade normally, then disable the read-only "
+"middleware and re-enable and restart the object-reconstructor."
+msgstr ""
+"If your users can tolerate it, consider a read-only rolling upgrade. Before "
+"upgrading, enable the `read-only middleware `__ cluster-wide to prevent new "
+"writes during the upgrade. Additionally, stop and disable the object-"
+"reconstructor as above. Upgrade normally, then disable the read-only "
+"middleware and re-enable and restart the object-reconstructor."
+
+msgid "Imported docs content from openstack-manuals project."
+msgstr "Imported docs content from openstack-manuals project."
+
+msgid "Improve performance when increasing partition power."
+msgstr "Improve performance when increasing partition power."
+
+msgid "Improved S3 API compatibility."
+msgstr "Improved S3 API compatibility."
+
+msgid ""
+"Improved ``object-updater`` stats logging. It now tells you all of its stats "
+"(successes, failures, quarantines due to bad pickles, unlinks, and errors), "
+"and it tells you incremental progress every five minutes. The logging at the "
+"end of a pass remains and has been expanded to also include all stats."
+msgstr ""
+"Improved ``object-updater`` stats logging. It now tells you all of its stats "
+"(successes, failures, quarantines due to bad pickles, unlinks, and errors), "
+"and it tells you incremental progress every five minutes. The logging at the "
+"end of a pass remains and has been expanded to also include all stats."
+
+msgid "Improved cache management for account and container responses."
+msgstr "Improved cache management for account and container responses."
+
+msgid "Improved compatibility with certain FIPS-mode-enabled systems."
+msgstr "Improved compatibility with certain FIPS-mode-enabled systems."
+
+msgid ""
+"Improved container-sharder stat reporting to reduce load on root container "
+"databases."
+msgstr ""
+"Improved container-sharder stat reporting to reduce load on root container "
+"databases."
+
+msgid ""
+"Improved container-sync performance when data has already been deleted or "
+"overwritten."
+msgstr ""
+"Improved container-sync performance when data has already been deleted or "
+"overwritten."
+
+msgid ""
+"Improved how containers reclaim deleted rows to reduce locking and object "
+"update throughput."
+msgstr ""
+"Improved how containers reclaim deleted rows to reduce locking and object "
+"update throughput."
+
+msgid ""
+"Improved logging and statsd metrics. Be aware that this will cause an "
+"increase in the proxy-logging statsd metrics emited for S3 responses. "
+"However, this should more accurately reflect the state of the system."
+msgstr ""
+"Improved logging and statsd metrics. Be aware that this will cause an "
+"increase in the proxy-logging statsd metrics emitted for S3 responses. "
+"However, this should more accurately reflect the state of the system."
+
+msgid ""
+"Improved performance by eliminating an unneeded directory structure hash."
+msgstr ""
+"Improved performance by eliminating an unneeded directory structure hash."
+
+msgid ""
+"Improved performance of sharded container listings when performing prefix "
+"listings."
+msgstr ""
+"Improved performance of sharded container listings when performing prefix "
+"listings."
+
+msgid ""
+"Improved proxy-server performance by reducing unnecessary locking, memory "
+"copies, and eventlet scheduling."
+msgstr ""
+"Improved proxy-server performance by reducing unnecessary locking, memory "
+"copies, and eventlet scheduling."
+
+msgid "Improved proxy-to-backend requests to be more RFC-compliant."
+msgstr "Improved proxy-to-backend requests to be more RFC-compliant."
+
+msgid "Improved quota-exceeded error messages."
+msgstr "Improved quota-exceeded error messages."
+
+msgid ""
+"Improved relinker progress logging, and started collecting progress "
+"information for swift-recon."
+msgstr ""
+"Improved relinker progress logging, and started collecting progress "
+"information for swift-recon."
+
+msgid ""
+"Improved safety during cleanup to ensure files have been relinked "
+"appropriately before unlinking."
+msgstr ""
+"Improved safety during cleanup to ensure files have been relinked "
+"appropriately before unlinking."
+
+msgid ""
+"Improved the error message when deleting a bucket that's ever had versioning "
+"enabled and still has versions in it."
+msgstr ""
+"Improved the error message when deleting a bucket that's ever had versioning "
+"enabled and still has versions in it."
+
+msgid ""
+"Improved the granularity of the ring dispersion metric so that small "
+"improvements after a rebalance can show changes in the dispersion number. "
+"Dispersion in existing and new rings can be recalculated using the new ``--"
+"recalculate`` option to ``swift-ring-builder``."
+msgstr ""
+"Improved the granularity of the ring dispersion metric so that small "
+"improvements after a rebalance can show changes in the dispersion number. "
+"Dispersion in existing and new rings can be recalculated using the new ``--"
+"recalculate`` option to ``swift-ring-builder``."
+
+msgid "Improvements in key parts of the consistency engine"
+msgstr "Improvements in key parts of the consistency engine"
+
+msgid ""
+"In SLO manifests, the `etag` and `size_bytes` keys are now fully optional "
+"and not required. Previously, the keys needed to exist but the values were "
+"optional. The only required key is `path`."
+msgstr ""
+"In SLO manifests, the `etag` and `size_bytes` keys are now fully optional "
+"and not required. Previously, the keys needed to exist but the values were "
+"optional. The only required key is `path`."
+
+msgid ""
+"In a rolling upgrade from liberasurecode 1.5.0 or earlier to 1.6.0 or later, "
+"object-servers may quarantine newly-written data, leading to availability "
+"issues or even data loss. See `bug 1886088 `__ for more information, including how to "
+"determine whether you are affected. Several mitigations are available to "
+"operators:"
+msgstr ""
+"In a rolling upgrade from liberasurecode 1.5.0 or earlier to 1.6.0 or later, "
+"object-servers may quarantine newly-written data, leading to availability "
+"issues or even data loss. See `bug 1886088 `__ for more information, including how to "
+"determine whether you are affected. Several mitigations are available to "
+"operators:"
+
+msgid ""
+"In the ratelimit middleware, account whitelist and blacklist settings have "
+"been deprecated and may be removed in a future release. When found, a "
+"deprecation message will be logged. Instead of these config file values, set "
+"X-Account-Sysmeta- Global-Write-Ratelimit:WHITELIST and X-Account-Sysmeta-"
+"Global- Write-Ratelimit:BLACKLIST on the particular accounts that need to be "
+"whitelisted or blacklisted. System metadata cannot be added or modified by "
+"standard clients. Use the internal client to set sysmeta."
+msgstr ""
+"In the ratelimit middleware, account whitelist and blacklist settings have "
+"been deprecated and may be removed in a future release. When found, a "
+"deprecation message will be logged. Instead of these config file values, set "
+"X-Account-Sysmeta- Global-Write-Ratelimit:WHITELIST and X-Account-Sysmeta-"
+"Global- Write-Ratelimit:BLACKLIST on the particular accounts that need to be "
+"whitelisted or blacklisted. System metadata cannot be added or modified by "
+"standard clients. Use the internal client to set sysmeta."
+
+msgid "Include ``Vary: Origin`` header when CORS responses vary by origin."
+msgstr "Include ``Vary: Origin`` header when CORS responses vary by origin."
+
+msgid ""
+"Include object sysmeta in POST responses. Sysmeta is still stripped from the "
+"response before being sent to the client, but this allows middleware to make "
+"use of the information."
+msgstr ""
+"Include object sysmeta in POST responses. Sysmeta is still stripped from the "
+"response before being sent to the client, but this allows middleware to make "
+"use of the information."
+
+msgid "Include received fragment index in reconstructor log warnings."
+msgstr "Include received fragment index in reconstructor log warnings."
+
+msgid ""
+"Instead of using a separate .durable file to indicate the durable status of "
+"an EC fragment archive, we rename the .data to include a durable marker in "
+"the filename. This saves one inode for every EC .data file. Existing ."
+"durable files will not be removed, and they will continue to work just fine."
+msgstr ""
+"Instead of using a separate .durable file to indicate the durable status of "
+"an EC fragment archive, we rename the .data to include a durable marker in "
+"the filename. This saves one inode for every EC .data file. Existing ."
+"durable files will not be removed, and they will continue to work just fine."
+
+msgid "Internal client no longer logs object DELETEs as status 499."
+msgstr "Internal client no longer logs object DELETEs as status 499."
+
+msgid ""
+"Internal clients now correctly use their configured ``User-Agent`` in "
+"backend requests, rather than only using it for logging."
+msgstr ""
+"Internal clients now correctly use their configured ``User-Agent`` in "
+"backend requests, rather than only using it for logging."
+
+msgid "Known Issues"
+msgstr "Known Issues"
+
+msgid "Large object reads log fewer client disconnects."
+msgstr "Large object reads log fewer client disconnects."
+
+msgid ""
+"Let clients request heartbeats during SLO PUTs by including the query "
+"parameter ``heartbeat=on``."
+msgstr ""
+"Let clients request heartbeats during SLO PUTs by including the query "
+"parameter ``heartbeat=on``."
+
+msgid ""
+"Listing containers in accounts with json or xml now includes a "
+"`last_modified` time. This does not change any on-disk data, but simply "
+"exposes the value to offer consistency with the object listings on "
+"containers."
+msgstr ""
+"Listing containers in accounts with JSON or XML now includes a "
+"`last_modified` time. This does not change any on-disk data, but simply "
+"exposes the value to offer consistency with the object listings on "
+"containers."
+
+msgid ""
+"Lock timeouts in the container updater are now logged at INFO level, not "
+"ERROR."
+msgstr ""
+"Lock timeouts in the container updater are now logged at INFO level, not "
+"ERROR."
+
+msgid "Log correct status code for conditional requests."
+msgstr "Log correct status code for conditional requests."
+
+msgid ""
+"Log deprecation warning for ``allow_versions`` in the container server "
+"config. Configure the ``versioned_writes`` middleware in the proxy server "
+"instead. This option will be ignored in a future release."
+msgstr ""
+"Log deprecation warning for ``allow_versions`` in the container server "
+"config. Configure the ``versioned_writes`` middleware in the proxy server "
+"instead. This option will be ignored in a future release."
+
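+# Illustrative sketch for the entry above (the middleware name comes from the
+# note; the exact filter section and ``allow_versioned_writes`` option in
+# proxy-server.conf are assumptions):
+#
+#   [filter:versioned_writes]
+#   use = egg:swift#versioned_writes
+#   allow_versioned_writes = true
+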
+msgid ""
+"Log deprecation warnings for ``run_pause``. This setting was deprecated in "
+"Swift 2.4.0 and is replaced by ``interval``. It may be removed in a future "
+"release."
+msgstr ""
+"Log deprecation warnings for ``run_pause``. This setting was deprecated in "
+"Swift 2.4.0 and is replaced by ``interval``. It may be removed in a future "
+"release."
+
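+# Illustrative sketch for the entry above (shown for an object-replicator
+# section as an assumption; the interval value is an example):
+#
+#   [object-replicator]
+#   # formerly: run_pause = 30
+#   interval = 30
+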
+msgid ""
+"Log formats are now more configurable and include support for anonymization. "
+"See the ``log_msg_template`` option in ``proxy-server.conf`` and `the Swift "
+"documentation `__ for more information."
+msgstr ""
+"Log formats are now more configurable and include support for anonymization. "
+"See the ``log_msg_template`` option in ``proxy-server.conf`` and `the Swift "
+"documentation `__ for more information."
+
+msgid "Log progress per partition when relinking/cleaning up."
+msgstr "Log progress per partition when relinking/cleaning up."
+
+msgid "Log the correct request type of a subrequest downstream of copy."
+msgstr "Log the correct request type of a sub-request downstream of copy."
+
+msgid "Logging improvements"
+msgstr "Logging improvements"
+
+msgid ""
+"Lower bounds of dependencies have been updated to reflect what is actually "
+"tested."
+msgstr ""
+"Lower bounds of dependencies have been updated to reflect what is actually "
+"tested."
+
+msgid ""
+"Make mount_check option usable in containerized environments by adding a "
+"check for an \".ismount\" file at the root directory of a device."
+msgstr ""
+"Make mount_check option usable in containerised environments by adding a "
+"check for an \".ismount\" file at the root directory of a device."
+
+msgid ""
+"Metrics are now emitted for a variety of S3 error responses, in the form "
+"``s3api..[.]``"
+msgstr ""
+"Metrics are now emitted for a variety of S3 error responses, in the form "
+"``s3api..[.]``"
+
+msgid ""
+"Metrics are now emitted for whether databases used for cleaving were created "
+"or already existed, allowing a better understanding of the reason for "
+"handoffs in the cluster."
+msgstr ""
+"Metrics are now emitted for whether databases used for cleaving were created "
+"or already existed, allowing a better understanding of the reason for "
+"handoffs in the cluster."
+
+msgid "Metrics improvements:"
+msgstr "Metrics improvements:"
+
+msgid "Mirror X-Trans-Id to X-Openstack-Request-Id."
+msgstr "Mirror X-Trans-Id to X-Openstack-Request-Id."
+
+msgid "Misplaced tombstone records are now properly cleaved."
+msgstr "Misplaced tombstone records are now properly cleaved."
+
+msgid ""
+"Misplaced-record stats are now also emitted to statsd. Previously, these "
+"were only available in logs."
+msgstr ""
+"Misplaced-record stats are now also emitted to statsd. Previously, these "
+"were only available in logs."
+
+msgid "More daemons now support systemd notify sockets."
+msgstr "More daemons now support systemd notify sockets."
+
+msgid ""
+"More headers are now copied from multi-part upload markers to their "
+"completed objects, including ``Content-Encoding``."
+msgstr ""
+"More headers are now copied from multi-part upload markers to their "
+"completed objects, including ``Content-Encoding``."
+
+msgid ""
+"More information is now synced to the fresh database when sharding. "
+"Previously, a database could lose the fact that it had been marked as "
+"deleted."
+msgstr ""
+"More information is now synced to the fresh database when sharding. "
+"Previously, a database could lose the fact that it had been marked as "
+"deleted."
+
+msgid ""
+"Move listing formatting out to a new proxy middleware named "
+"``listing_formats``. ``listing_formats`` should be just right of the first "
+"proxy-logging middleware, and left of most other middlewares. If it is not "
+"already present, it will be automatically inserted for you."
+msgstr ""
+"Move listing formatting out to a new proxy middleware named "
+"``listing_formats``. ``listing_formats`` should be just right of the first "
+"proxy-logging middleware, and left of most other middleware. If it is not "
+"already present, it will be automatically inserted for you."
+
+msgid "Moved Zuul v3 tox jobs into the Swift code repo."
+msgstr "Moved Zuul v3 tox jobs into the Swift code repo."
+
+msgid ""
+"Moved other-requirements.txt to bindep.txt. bindep.txt lists non-python "
+"dependencies of Swift."
+msgstr ""
+"Moved other-requirements.txt to bindep.txt. bindep.txt lists non-Python "
+"dependencies of Swift."
+
+msgid ""
+"Multi-character strings may now be used as delimiters in account and "
+"container listings."
+msgstr ""
+"Multi-character strings may now be used as delimiters in account and "
+"container listings."
+
+msgid ""
+"Multipart object segments are now actually deleted when the multipart object "
+"is deleted via the S3 API."
+msgstr ""
+"Multipart object segments are now actually deleted when the multipart object "
+"is deleted via the S3 API."
+
+msgid "Multipart upload parts may now be copied from other multipart uploads."
+msgstr "Multipart upload parts may now be copied from other multipart uploads."
+
+msgid ""
+"Multiple keymaster middlewares are now supported. This allows migration from "
+"one key provider to another."
+msgstr ""
+"Multiple keymaster middlewares are now supported. This allows migration from "
+"one key provider to another."
+
+msgid "New Features"
+msgstr "New Features"
+
+msgid ""
+"New buckets created via the S3 API will now store multi-part upload data in "
+"the same storage policy as other data rather than the cluster's default "
+"storage policy."
+msgstr ""
+"New buckets created via the S3 API will now store multi-part upload data in "
+"the same storage policy as other data rather than the cluster's default "
+"storage policy."
+
+msgid ""
+"New config variables to change the schedule priority and I/O scheduling "
+"class. Servers and daemons now understand `nice_priority`, `ionice_class`, "
+"and `ionice_priority` to schedule their relative importance. Please read "
+"http://docs.openstack.org/developer/swift/deployment_guide.html for full "
+"config details."
+msgstr ""
+"New config variables to change the schedule priority and I/O scheduling "
+"class. Servers and daemons now understand `nice_priority`, `ionice_class`, "
+"and `ionice_priority` to schedule their relative importance. Please read "
+"http://docs.openstack.org/developer/swift/deployment_guide.html for full "
+"config details."
+
+msgid "Newton Series Release Notes"
+msgstr "Newton Series Release Notes"
+
+msgid "Non-durable fragments can now be reverted from handoffs."
+msgstr "Non-durable fragments can now be reverted from handoffs."
+
+msgid ""
+"Note that ``secret_id`` values must remain unique across all keymasters in a "
+"given pipeline. If they are not unique, the right-most keymaster will take "
+"precedence."
+msgstr ""
+"Note that ``secret_id`` values must remain unique across all keymasters in a "
+"given pipeline. If they are not unique, the right-most keymaster will take "
+"precedence."
+
+msgid ""
+"Note that after writing EC data with Swift 2.11.0 or later, that data will "
+"not be accessible to earlier versions of Swift."
+msgstr ""
+"Note that after writing EC data with Swift 2.11.0 or later, that data will "
+"not be accessible to earlier versions of Swift."
+
+msgid ""
+"Note: if you have a custom middleware that makes account or container "
+"listings, it will only receive listings in JSON format."
+msgstr ""
+"Note: if you have a custom middleware that makes account or container "
+"listings, it will only receive listings in JSON format."
+
+msgid ""
+"Now Swift will use ``write_affinity_handoff_delete_count`` to define how "
+"many local handoff nodes should swift send request to get more candidates "
+"for the final response. The default value \"auto\" means Swift will "
+"calculate the number automatically based on the number of replicas and "
+"current cluster topology."
+msgstr ""
+"Now Swift will use ``write_affinity_handoff_delete_count`` to define how "
+"many local hand-off nodes should swift send request to get more candidates "
+"for the final response. The default value \"auto\" means Swift will "
+"calculate the number automatically based on the number of replicas and "
+"current cluster topology."
+
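+# Illustrative sketch for the entry above (the option name and "auto" default
+# are quoted from the note; the [app:proxy-server] section in
+# proxy-server.conf is an assumption):
+#
+#   [app:proxy-server]
+#   write_affinity_handoff_delete_count = auto
+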
+msgid "Now ``swift-recon-cron`` works with conf.d configs."
+msgstr "Now ``swift-recon-cron`` works with conf.d configs."
+
+msgid ""
+"O_TMPFILE support is now detected by attempting to use it instead of looking "
+"at the kernel version. This allows older kernels with backported patches to "
+"take advantage of the O_TMPFILE functionality."
+msgstr ""
+"O_TMPFILE support is now detected by attempting to use it instead of looking "
+"at the kernel version. This allows older kernels with backported patches to "
+"take advantage of the O_TMPFILE functionality."
+
+msgid ""
+"Object expiration respects the ``expiring_objects_container_divisor`` config "
+"option."
+msgstr ""
+"Object expiration respects the ``expiring_objects_container_divisor`` config "
+"option."
+
+msgid "Object expiry improvements"
+msgstr "Object expiry improvements"
+
+msgid ""
+"Object reconstructor logs are now prefixed with information about the "
+"specific worker process logging the message. This makes reading the logs and "
+"understanding the messages much simpler."
+msgstr ""
+"Object reconstructor logs are now prefixed with information about the "
+"specific worker process logging the message. This makes reading the logs and "
+"understanding the messages much simpler."
+
+msgid ""
+"Object versioning now supports a \"history\" mode in addition to the older "
+"\"stack\" mode. The difference is in how DELETE requests are handled. For "
+"full details, please read http://docs.openstack.org/developer/swift/"
+"overview_object_versioning.html."
+msgstr ""
+"Object versioning now supports a \"history\" mode in addition to the older "
+"\"stack\" mode. The difference is in how DELETE requests are handled. For "
+"full details, please read http://docs.openstack.org/developer/swift/"
+"overview_object_versioning.html."
+
+msgid ""
+"Object writes to a container whose existence cannot be verified now 503 "
+"instead of 404."
+msgstr ""
+"Object writes to a container whose existence cannot be verified now 503 "
+"instead of 404."
+
+msgid ""
+"Objects with an ``X-Delete-At`` value in the far future no longer cause "
+"backend server errors."
+msgstr ""
+"Objects with an ``X-Delete-At`` value in the far future no longer cause "
+"backend server errors."
+
+msgid "Ocata Series Release Notes"
+msgstr "Ocata Series Release Notes"
+
+msgid ""
+"On Python 3, certain S3 API headers are now lower case as they would be "
+"coming from AWS."
+msgstr ""
+"On Python 3, certain S3 API headers are now lower case as they would be "
+"coming from AWS."
+
+msgid ""
+"On Python 3, fixed a RecursionError in swift-dispersion-report when using "
+"TLS."
+msgstr ""
+"On Python 3, fixed a RecursionError in swift-dispersion-report when using "
+"TLS."
+
+msgid ""
+"On Python 3, fixed an issue when reading or writing objects with a content "
+"type like ``message/*``. Previously, Swift would fail to respond."
+msgstr ""
+"On Python 3, fixed an issue when reading or writing objects with a content "
+"type like ``message/*``. Previously, Swift would fail to respond."
+
+msgid ""
+"On Python 3, the KMS keymaster now works with secrets stored in Barbican "
+"with a ``text/plain`` payload-content-type."
+msgstr ""
+"On Python 3, the KMS keymaster now works with secrets stored in Barbican "
+"with a ``text/plain`` payload-content-type."
+
+msgid "On Python 3, the formpost middleware now works with unicode file names."
+msgstr ""
+"On Python 3, the formpost middleware now works with Unicode file names."
+
+msgid ""
+"On newer kernels (3.15+ when using xfs), Swift will use the O_TMPFILE flag "
+"when opening a file instead of creating a temporary file and renaming it on "
+"commit. This makes the data path simpler and allows the filesystem to more "
+"efficiently optimize the files on disk, resulting in better performance."
+msgstr ""
+"On newer kernels (3.15+ when using xfs), Swift will use the O_TMPFILE flag "
+"when opening a file instead of creating a temporary file and renaming it on "
+"commit. This makes the data path simpler and allows the filesystem to more "
+"efficiently optimise the files on disk, resulting in better performance."
+
+msgid ""
+"On upgrade, a node configured with concurrency=N will still handle async "
+"updates N-at-a-time, but will do so using only one process instead of N."
+msgstr ""
+"On upgrade, a node configured with concurrency=N will still handle async "
+"updates N-at-a-time, but will do so using only one process instead of N."
+
+msgid ""
+"Operators should verify that encryption is not enabled in their reconciler "
+"pipelines; having it enabled there may harm data durability. For more "
+"information, see `bug 1910804 `__."
+msgstr ""
+"Operators should verify that encryption is not enabled in their reconciler "
+"pipelines; having it enabled there may harm data durability. For more "
+"information, see `bug 1910804 `__."
+
+msgid ""
+"Optimize the Erasure Code reconstructor protocol to reduce IO load on "
+"servers."
+msgstr ""
+"Optimise the Erasure Code reconstructor protocol to reduce I/O load on "
+"servers."
+
+msgid ""
+"Optimized the common case for hashing filesystem trees, thus eliminating a "
+"lot of extraneous disk I/O."
+msgstr ""
+"Optimised the common case for hashing filesystem trees, thus eliminating a "
+"lot of extraneous disk I/O."
+
+msgid ""
+"Ordinary objects in S3 use the MD5 of the object as the ETag, just like "
+"Swift. Multipart Uploads follow a different format, notably including a dash "
+"followed by the number of segments. To that end (and for S3 API requests "
+"*only*), SLO responses via the S3 API have a literal '-N' added on the end "
+"of the ETag."
+msgstr ""
+"Ordinary objects in S3 use the MD5 of the object as the ETag, just like "
+"Swift. Multipart Uploads follow a different format, notably including a dash "
+"followed by the number of segments. To that end (and for S3 API requests "
+"*only*), SLO responses via the S3 API have a literal '-N' added on the end "
+"of the ETag."
+
+msgid "Other Notes"
+msgstr "Other Notes"
+
+msgid ""
+"Overlapping shrinking shards no longer generate audit warnings; these are "
+"expected to sometimes overlap."
+msgstr ""
+"Overlapping shrinking shards no longer generate audit warnings; these are "
+"expected to sometimes overlap."
+
+msgid ""
+"PUT subrequests generated from a client-side COPY will now properly log the "
+"SSC (server-side copy) Swift source field. See https://docs.openstack.org/"
+"developer/swift/logs.html#swift-source for more information."
+msgstr ""
+"PUT sub-requests generated from a client-side COPY will now properly log the "
+"SSC (server-side copy) Swift source field. See https://docs.openstack.org/"
+"developer/swift/logs.html#swift-source for more information."
+
+msgid ""
+"Partition cleanup is more robust, decreasing the likelihood of leaving "
+"behind mostly-empty partitions from the old partition power."
+msgstr ""
+"Partition cleanup is more robust, decreasing the likelihood of leaving "
+"behind mostly-empty partitions from the old partition power."
+
+msgid "Partition power increase fixes:"
+msgstr "Partition power increase fixes:"
+
+msgid "Partition power increase improvements:"
+msgstr "Partition power increase improvements:"
+
+msgid ""
+"Partitions that encountered errors during relinking are no longer marked as "
+"completed in the relinker state file. This ensures that a subsequent relink "
+"will retry the failed partitions."
+msgstr ""
+"Partitions that encountered errors during relinking are no longer marked as "
+"completed in the relinker state file. This ensures that a subsequent relink "
+"will retry the failed partitions."
+
+msgid ""
+"Per-service ``auto_create_account_prefix`` settings are now deprecated and "
+"may be ignored in a future release; if you need to use this, please set it "
+"in the ``[swift-constraints]`` section of ``/etc/swift/swift.conf``."
+msgstr ""
+"Per-service ``auto_create_account_prefix`` settings are now deprecated and "
+"may be ignored in a future release; if you need to use this, please set it "
+"in the ``[swift-constraints]`` section of ``/etc/swift/swift.conf``."
+
+msgid ""
+"Pickle support has been removed from Swift's memcache client. Support had "
+"been deprecated since Swift 1.7.0."
+msgstr ""
+"Pickle support has been removed from Swift's memcache client. Support had "
+"been deprecated since Swift 1.7.0."
+
+msgid "Pike Series Release Notes"
+msgstr "Pike Series Release Notes"
+
+msgid ""
+"Preflight requests do not contain enough information to map a bucket to an "
+"account/container pair; a new cluster-wide option "
+"``cors_preflight_allow_origin`` may be configured for such OPTIONS requests. "
+"The default (blank) rejects all S3 preflight requests."
+msgstr ""
+"Preflight requests do not contain enough information to map a bucket to an "
+"account/container pair; a new cluster-wide option "
+"``cors_preflight_allow_origin`` may be configured for such OPTIONS requests. "
+"The default (blank) rejects all S3 preflight requests."
+
+msgid ""
+"Prevent PyKMIP's kmip_protocol logger from logging at DEBUG. Previously, "
+"some versions of PyKMIP would include all wire data when the root logger was "
+"configured to log at DEBUG; this could expose key material in logs. Only the "
+"``kmip_keymaster`` was affected."
+msgstr ""
+"Prevent PyKMIP's kmip_protocol logger from logging at DEBUG. Previously, "
+"some versions of PyKMIP would include all wire data when the root logger was "
+"configured to log at DEBUG; this could expose key material in logs. Only the "
+"``kmip_keymaster`` was affected."
+
+msgid ""
+"Prevent PyKMIP's kmip_protocol logger from logging at DEBUG. Previously, "
+"some versions of PyKMIP would include all wire data when the root logger was "
+"configured to log at DEBUG; this could expose key material in logs. Only the "
+"kmip_keymaster was affected."
+msgstr ""
+"Prevent PyKMIP's kmip_protocol logger from logging at DEBUG. Previously, "
+"some versions of PyKMIP would include all wire data when the root logger was "
+"configured to log at DEBUG; this could expose key material in logs. Only the "
+"kmip_keymaster was affected."
+
+msgid ""
+"Prevent logged traceback in object-server on client disconnect for chunked "
+"transfers to replicated policies."
+msgstr ""
+"Prevent logged traceback in object-server on client disconnect for chunked "
+"transfers to replicated policies."
+
+msgid ""
+"Prevent object updates from auto-creating shard containers. This ensures "
+"more consistent listings for sharded containers during rebalances."
+msgstr ""
+"Prevent object updates from auto-creating shard containers. This ensures "
+"more consistent listings for sharded containers during rebalances."
+
+msgid ""
+"Prevent shard databases from losing track of their root database when "
+"deleted."
+msgstr ""
+"Prevent shard databases from losing track of their root database when "
+"deleted."
+
+msgid ""
+"Prevent sharded root databases from being reclaimed to ensure that shards "
+"can detect that they have been deleted."
+msgstr ""
+"Prevent sharded root databases from being reclaimed to ensure that shards "
+"can detect that they have been deleted."
+
+msgid ""
+"Previously, when deleting objects in multi-region swift deployment with "
+"write affinity configured, users always get 404 when deleting object before "
+"it's replicated to appropriate nodes."
+msgstr ""
+"Previously, when deleting objects in multi-region swift deployment with "
+"write affinity configured, users always get 404 when deleting object before "
+"it's replicated to appropriate nodes."
+
+msgid ""
+"Provide an S3 API compatibility layer. The external \"swift3\" project has "
+"been imported into Swift's codebase as the \"s3api\" middleware."
+msgstr ""
+"Provide an S3 API compatibility layer. The external \"swift3\" project has "
+"been imported into Swift's codebase as the \"s3api\" middleware."
+
+msgid ""
+"Provide useful status codes in logs for some versioning and symlink "
+"subrequests that were previously logged as 499."
+msgstr ""
+"Provide useful status codes in logs for some versioning and symlink "
+"subrequests that were previously logged as 499."
+
+msgid ""
+"Proxy logging for Complete Multipart Upload requests is now more consistent "
+"when requests have been retried."
+msgstr ""
+"Proxy logging for Complete Multipart Upload requests is now more consistent "
+"when requests have been retried."
+
+msgid ""
+"Proxy, account, container, and object servers now support \"seamless "
+"reloads\" via ``SIGUSR1``. This is similar to the existing graceful restarts "
+"but keeps the server socket open the whole time, reducing service downtime."
+msgstr ""
+"Proxy, account, container, and object servers now support \"seamless "
+"reloads\" via ``SIGUSR1``. This is similar to the existing graceful restarts "
+"but keeps the server socket open the whole time, reducing service downtime."
+
+msgid "Python 3 bug fixes:"
+msgstr "Python 3 bug fixes:"
+
+msgid "Python 3 fixes:"
+msgstr "Python 3 fixes:"
+
+msgid "Python 3.11 is now supported."
+msgstr "Python 3.11 is now supported."
+
+msgid ""
+"Python 3.6 and 3.7 are now fully supported. If you've been testing Swift on "
+"Python 3, upgrade at your earliest convenience."
+msgstr ""
+"Python 3.6 and 3.7 are now fully supported. If you've been testing Swift on "
+"Python 3, upgrade at your earliest convenience."
+
+msgid "Queens Series Release Notes"
+msgstr "Queens Series Release Notes"
+
+msgid "Reduced log noise for common ssync errors."
+msgstr "Reduced log noise for common ssync errors."
+
+msgid ""
+"Reduced object-replicator and object-reconstructor CPU usage by only "
+"checking that the device list is current when rings change."
+msgstr ""
+"Reduced object-replicator and object-reconstructor CPU usage by only "
+"checking that the device list is current when rings change."
+
+msgid ""
+"Reduced the backend load of making ``?versions`` requests to a container "
+"that has never had object versioning enabled."
+msgstr ""
+"Reduced the backend load of making ``?versions`` requests to a container "
+"that has never had object versioning enabled."
+
+msgid ""
+"Reduced the frequency of ``Reclaimable db stuck waiting for shrinking`` "
+"messages when a root DB has been deleted but its shards have not been shrunk "
+"away."
+msgstr ""
+"Reduced the frequency of ``Reclaimable db stuck waiting for shrinking`` "
+"messages when a root DB has been deleted but its shards have not been shrunk "
+"away."
+
+msgid ""
+"Region name config option is now respected when configuring S3 credential "
+"caching."
+msgstr ""
+"Region name config option is now respected when configuring S3 credential "
+"caching."
+
+msgid ""
+"Rehash partitions during the partition power increase. Previously, we relied "
+"on the replication engine to perform the rehash, which could cause an "
+"unexpected I/O spike after a partition power increase."
+msgstr ""
+"Rehash partitions during the partition power increase. Previously, we relied "
+"on the replication engine to perform the rehash, which could cause an "
+"unexpected I/O spike after a partition power increase."
+
+msgid ""
+"Remove ``swift-temp-url`` script. The functionality has been in swiftclient "
+"for a long time and this script has been deprecated since 2.10.0."
+msgstr ""
+"Remove ``swift-temp-url`` script. The functionality has been in swiftclient "
+"for a long time and this script has been deprecated since 2.10.0."
+
+msgid "Remove deprecated ``vm_test_mode`` option."
+msgstr "Remove deprecated ``vm_test_mode`` option."
+
+msgid "Remove empty db hash and suffix directories if a db gets quarantined."
+msgstr "Remove empty DB hash and suffix directories if a DB gets quarantined."
+
+msgid ""
+"Removed \"in-process-\" from func env tox name to work with upstream CI."
+msgstr ""
+"Removed \"in-process-\" from func env tox name to work with upstream CI."
+
+msgid ""
+"Removed a race condition that could cause newly-written data to not be "
+"linked into the new partition for the new partition power."
+msgstr ""
+"Removed a race condition that could cause newly-written data to not be "
+"linked into the new partition for the new partition power."
+
+msgid ""
+"Removed a race condition where a POST to an SLO could modify the X-Static-"
+"Large-Object metadata."
+msgstr ""
+"Removed a race condition where a POST to an SLO could modify the X-Static-"
+"Large-Object metadata."
+
+msgid ""
+"Removed a request-smuggling vector when running a mixed py2/py3 cluster."
+msgstr ""
+"Removed a request-smuggling vector when running a mixed py2/py3 cluster."
+
+msgid ""
+"Removed all ``post_as_copy`` related code and configs. The option has been "
+"deprecated since 2.13.0."
+msgstr ""
+"Removed all ``post_as_copy`` related code and configs. The option has been "
+"deprecated since 2.13.0."
+
+msgid ""
+"Removed per-device reconstruction stats. Now that the reconstructor is "
+"shuffling parts before going through them, those stats no longer make sense."
+msgstr ""
+"Removed per-device reconstruction stats. Now that the reconstructor is "
+"shuffling parts before going through them, those stats no longer make sense."
+
+msgid ""
+"Removed the hard dependency on netifaces; it may still be used if the "
+"``getifaddrs`` C function is not available. This fallback support may be "
+"removed in a future release."
+msgstr ""
+"Removed the hard dependency on netifaces; it may still be used if the "
+"``getifaddrs`` C function is not available. This fallback support may be "
+"removed in a future release."
+
+msgid ""
+"Replaced ``replication_one_per_device`` by custom count defined by "
+"``replication_concurrency_per_device``. The original config value is "
+"deprecated, but continues to function for now. If both values are defined, "
+"the old ``replication_one_per_device`` is ignored."
+msgstr ""
+"Replaced ``replication_one_per_device`` by custom count defined by "
+"``replication_concurrency_per_device``. The original config value is "
+"deprecated, but continues to function for now. If both values are defined, "
+"the old ``replication_one_per_device`` is ignored."
+
+msgid "Replication fixes:"
+msgstr "Replication fixes:"
+
+msgid "Replication improvements:"
+msgstr "Replication improvements:"
+
+msgid ""
+"Replication servers can now handle all request methods. This allows ssync to "
+"work with a separate replication network."
+msgstr ""
+"Replication servers can now handle all request methods. This allows ssync to "
+"work with a separate replication network."
+
+msgid ""
+"Requesting multiple ranges from a Dynamic Large Object now returns the "
+"entire object instead of incorrect data. This was previously fixed in 2.23.0."
+msgstr ""
+"Requesting multiple ranges from a Dynamic Large Object now returns the "
+"entire object instead of incorrect data. This was previously fixed in 2.23.0."
+
+msgid "Require that known-bad EC schemes be deprecated"
+msgstr "Require that known-bad EC schemes be deprecated"
+
+msgid "Respect server type for --md5 check in swift-recon."
+msgstr "Respect server type for --md5 check in swift-recon."
+
+msgid ""
+"Respond 400 Bad Request when Accept headers fail to parse instead of "
+"returning 406 Not Acceptable."
+msgstr ""
+"Respond 400 Bad Request when Accept headers fail to parse instead of "
+"returning 406 Not Acceptable."
+
+msgid ""
+"Return an error if the SLO manifest could not be parsed. Previously, a zero-"
+"byte response was returned."
+msgstr ""
+"Return an error if the SLO manifest could not be parsed. Previously, a zero-"
+"byte response was returned."
+
+msgid "Ring builder output tables better display weights over 1000."
+msgstr "Ring builder output tables better display weights over 1000."
+
+msgid ""
+"Ring files now include byteorder information about the endian of the machine "
+"used to generate the file, and the values are appropriately byteswapped if "
+"deserialized on a machine with a different endianness. Newly created ring "
+"files will be byteorder agnostic, but previously generated ring files will "
+"still fail on different endian architectures. Regenerating older ring files "
+"will cause them to become byteorder agnostic. The regeneration of the ring "
+"files will not cause any new data movement. Newer ring files will still be "
+"usable by older versions of Swift (on machines with the same endianness--"
+"this maintains existing behavior)."
+msgstr ""
+"Ring files now include byteorder information about the endian of the machine "
+"used to generate the file, and the values are appropriately byteswapped if "
+"deserialised on a machine with a different endianness. Newly created ring "
+"files will be byteorder agnostic, but previously generated ring files will "
+"still fail on different endian architectures. Regenerating older ring files "
+"will cause them to become byteorder agnostic. The regeneration of the ring "
+"files will not cause any new data movement. Newer ring files will still be "
+"usable by older versions of Swift (on machines with the same endianness--"
+"this maintains existing behaviour)."
+
+msgid ""
+"Rings with min_part_hours set to zero will now only move one partition "
+"replica per rebalance, thus matching behavior when min_part_hours is greater "
+"than zero."
+msgstr ""
+"Rings with min_part_hours set to zero will now only move one partition "
+"replica per rebalance, thus matching behaviour when min_part_hours is "
+"greater than zero."
+
+msgid "Rocky Series Release Notes"
+msgstr "Rocky Series Release Notes"
+
+msgid "S3 API compatibility updates"
+msgstr "S3 API compatibility updates"
+
+msgid "S3 API fixes:"
+msgstr "S3 API fixes:"
+
+msgid "S3 API improvements"
+msgstr "S3 API improvements"
+
+msgid "S3 API improvements:"
+msgstr "S3 API improvements:"
+
+msgid ""
+"S3 API now allows multipart uploads with non-ASCII characters in the object "
+"name."
+msgstr ""
+"S3 API now allows multipart uploads with non-ASCII characters in the object "
+"name."
+
+msgid ""
+"S3 API now translates ``503 Service Unavailable`` responses to a more S3-"
+"like response instead of raising an error."
+msgstr ""
+"S3 API now translates ``503 Service Unavailable`` responses to a more S3-"
+"like response instead of raising an error."
+
+msgid "S3 ETag for SLOs now include a '-'."
+msgstr "S3 ETag for SLOs now include a '-'."
+
+msgid "S3 requests are now less demanding on the container layer."
+msgstr "S3 requests are now less demanding on the container layer."
+
+msgid ""
+"SHA-1 signatures are now deprecated for the formpost and tempurl "
+"middlewares. At some point in the future, SHA-1 will no longer be enabled by "
+"default; eventually, support for it will be removed entirely."
+msgstr ""
+"SHA-1 signatures are now deprecated for the formpost and tempurl "
+"middlewares. At some point in the future, SHA-1 will no longer be enabled by "
+"default; eventually, support for it will be removed entirely."
+
+msgid ""
+"SLO manifest PUT requests can now be properly validated by sending an ETag "
+"header of the md5 sum of the concatenated md5 sums of the referenced "
+"segments."
+msgstr ""
+"SLO manifest PUT requests can now be properly validated by sending an ETag "
+"header of the MD5 sum of the concatenated MD5 sums of the referenced "
+"segments."
+
+msgid ""
+"SLO will now concurrently HEAD segments, resulting in much faster manifest "
+"validation and object creation. By default, two HEAD requests will be done "
+"at a time, but this can be changed by the operator via the new `concurrency` "
+"setting in the \"[filter:slo]\" section of the proxy server config."
+msgstr ""
+"SLO will now concurrently HEAD segments, resulting in much faster manifest "
+"validation and object creation. By default, two HEAD requests will be done "
+"at a time, but this can be changed by the operator via the new `concurrency` "
+"setting in the \"[filter:slo]\" section of the proxy server config."
+
+msgid ""
+"SSYNC replication mode now removes as much of the directory structure as "
+"possible as soon at it observes that the directory is empty. This reduces "
+"the work needed for subsequent replication passes."
+msgstr ""
+"SSYNC replication mode now removes as much of the directory structure as "
+"possible as soon at it observes that the directory is empty. This reduces "
+"the work needed for subsequent replication passes."
+
+msgid ""
+"Save the ring when dispersion improves, even if balance doesn't improve."
+msgstr ""
+"Save the ring when dispersion improves, even if balance doesn't improve."
+
+msgid "Security Issues"
+msgstr "Security Issues"
+
+msgid ""
+"See the provided ``keymaster.conf-sample`` for more information about this "
+"setting."
+msgstr ""
+"See the provided ``keymaster.conf-sample`` for more information about this "
+"setting."
+
+msgid "Send ETag header in 206 Partial Content responses to SLO reads."
+msgstr "Send ETag header in 206 Partial Content responses to SLO reads."
+
+msgid ""
+"Server errors encountered when validating the first segment of a Static or "
+"Dynamic Large Object now return a 503 to the client, rather than a 409."
+msgstr ""
+"Server errors encountered when validating the first segment of a Static or "
+"Dynamic Large Object now return a 503 to the client, rather than a 409."
+
+msgid ""
+"Server workers may now be gracefully terminated via ``SIGHUP`` or "
+"``SIGUSR1``. The parent process will then spawn a fresh worker."
+msgstr ""
+"Server workers may now be gracefully terminated via ``SIGHUP`` or "
+"``SIGUSR1``. The parent process will then spawn a fresh worker."
+
+msgid ""
+"Server-side copying of erasure-coded data to a replicated policy no longer "
+"copies EC sysmeta. The previous behavior had no material effect, but could "
+"confuse operators examining data on disk."
+msgstr ""
+"Server-side copying of erasure-coded data to a replicated policy no longer "
+"copies EC sysmeta. The previous behaviour had no material effect but could "
+"confuse operators examining data on disk."
+
+msgid ""
+"Servers now open one listen socket per worker, ensuring each worker serves "
+"roughly the same number of concurrent connections."
+msgstr ""
+"Servers now open one listen socket per worker, ensuring each worker serves "
+"roughly the same number of concurrent connections."
+
+msgid ""
+"Several fixes to prepare for Python 3.12 support. While not yet tested in "
+"the gate, initial manual testing looks promising."
+msgstr ""
+"Several fixes to prepare for Python 3.12 support. While not yet tested in "
+"the gate, initial manual testing looks promising."
+
+msgid "Several utility scripts now work better on Python 3:"
+msgstr "Several utility scripts now work better on Python 3:"
+
+msgid ""
+"Shard ranges with no rows to cleave could previously be left in the CREATED "
+"state after cleaving. Now, they are advanced to CLEAVED."
+msgstr ""
+"Shard ranges with no rows to cleave could previously be left in the CREATED "
+"state after cleaving. Now, they are advanced to CLEAVED."
+
+msgid ""
+"Sharding cycle time and last-completion time are now available via swift-"
+"recon."
+msgstr ""
+"Sharding cycle time and last-completion time are now available via swift-"
+"recon."
+
+msgid "Sharding fixes"
+msgstr "Sharding fixes"
+
+msgid "Sharding fixes:"
+msgstr "Sharding fixes:"
+
+msgid "Sharding improvements"
+msgstr "Sharding improvements"
+
+msgid "Sharding improvements:"
+msgstr "Sharding improvements:"
+
+msgid ""
+"Sharding metadata is no longer cleared when databases are deleted. This "
+"could previously cause deleted shards that still had rows to become stuck "
+"and never move them to the correct database."
+msgstr ""
+"Sharding metadata is no longer cleared when databases are deleted. This "
+"could previously cause deleted shards that still had rows to become stuck "
+"and never move them to the correct database."
+
+msgid ""
+"Shards no longer report stats to the root database when they are in the "
+"``CREATED`` state."
+msgstr ""
+"Shards no longer report stats to the root database when they are in the "
+"``CREATED`` state."
+
+msgid ""
+"Shuffle object-updater work. This somewhat reduces the impact a single "
+"overloaded database has on other containers' listings."
+msgstr ""
+"Shuffle object-updater work. This somewhat reduces the impact a single "
+"overloaded database has on other containers' listings."
+
+msgid ""
+"Signal handling is more consistently logged at notice level. Previously, "
+"signal handling would sometimes be logged at info or error levels."
+msgstr ""
+"Signal handling is more consistently logged at notice level. Previously, "
+"signal handling would sometimes be logged at info or error levels."
+
+msgid ""
+"Significant improvements to the api-ref doc available at http://developer."
+"openstack.org/api-ref/object-storage/."
+msgstr ""
+"Significant improvements to the api-ref doc available at http://developer."
+"openstack.org/api-ref/object-storage/."
+
+msgid ""
+"Similar to above, ``expansion_limit`` was added as an absolute-size "
+"replacement for the now-deprecated ``shard_shrink_merge_point`` "
+"configuration option."
+msgstr ""
+"Similar to above, ``expansion_limit`` was added as an absolute-size "
+"replacement for the now-deprecated ``shard_shrink_merge_point`` "
+"configuration option."
+
+msgid ""
+"Ssync no longer corrupts unencrypted non-ASCII metadata during transfers."
+msgstr ""
+"Ssync no longer corrupts unencrypted non-ASCII metadata during transfers."
+
+msgid ""
+"Static Large Object (SLO) manifest may now (again) have zero-byte last "
+"segments."
+msgstr ""
+"Static Large Object (SLO) manifest may now (again) have zero-byte last "
+"segments."
+
+msgid ""
+"Static Large Object sizes in listings for versioned containers are now more "
+"accurate."
+msgstr ""
+"Static Large Object sizes in listings for versioned containers are now more "
+"accurate."
+
+msgid "Static large object fixes:"
+msgstr "Static large object fixes:"
+
+msgid ""
+"Staticweb correctly handles listings when paths include non-ASCII characters."
+msgstr ""
+"Staticweb correctly handles listings when paths include non-ASCII characters."
+
+msgid "Stein Series Release Notes"
+msgstr "Stein Series Release Notes"
+
+msgid ""
+"Stop and disable the object-reconstructor before upgrading. This ensures no "
+"upgraded object server starts writing new fragments that old object servers "
+"would quarantine."
+msgstr ""
+"Stop and disable the object-reconstructor before upgrading. This ensures no "
+"upgraded object server starts writing new fragments that old object servers "
+"would quarantine."
+
+msgid ""
+"Stop logging tracebacks in the ``object-replicator`` when it runs out of "
+"handoff locations."
+msgstr ""
+"Stop logging tracebacks in the ``object-replicator`` when it runs out of "
+"handoff locations."
+
+msgid "Stopped logging tracebacks when receiving an unexpected response."
+msgstr "Stopped logging tracebacks when receiving an unexpected response."
+
+msgid ""
+"Storage policy definitions in swift.conf can now define the diskfile to use "
+"to access objects. See the included swift.conf-sample file for a description "
+"of usage."
+msgstr ""
+"Storage policy definitions in swift.conf can now define the diskfile to use "
+"to access objects. See the included swift.conf-sample file for a description "
+"of usage."
+
+msgid "Support multi-range GETs for static large objects."
+msgstr "Support multi-range GETs for static large objects."
+
+msgid "Suppress unexpected-file warnings for rsync temp files."
+msgstr "Suppress unexpected-file warnings for rsync temp files."
+
+msgid "Suppressed ``RemoteDisconnected`` tracebacks."
+msgstr "Suppressed ``RemoteDisconnected`` tracebacks."
+
+msgid "Suppressed the KeyError message when auditor finds an expired object."
+msgstr "Suppressed the KeyError message when auditor finds an expired object."
+
+msgid "Swift Release Notes"
+msgstr "Swift Release Notes"
+
+msgid ""
+"Swift can now cache the S3 secret from Keystone to use for subsequent "
+"requests. This functionality is disabled by default but can be enabled by "
+"setting the ``secret_cache_duration`` in the ``[filter:s3token]`` section of "
+"the proxy server config to a number greater than 0."
+msgstr ""
+"Swift can now cache the S3 secret from Keystone to use for subsequent "
+"requests. This functionality is disabled by default but can be enabled by "
+"setting the ``secret_cache_duration`` in the ``[filter:s3token]`` section of "
+"the proxy server config to a number greater than 0."
+
+msgid ""
+"Swift now returns a 503 (instead of a 500) when an account auto-create fails."
+msgstr ""
+"Swift now returns a 503 (instead of a 500) when an account auto-create fails."
+
+msgid "Swift path and on-disk path are now included with all sharder logging."
+msgstr "Swift path and on-disk path are now included with all sharder logging."
+
+msgid ""
+"Swift-all-in-one Docker images are now built and published to https://hub."
+"docker.com/r/openstackswift/saio. These are intended for use as development "
+"targets, but will hopefully be useful as a starting point for other work "
+"involving containerizing Swift."
+msgstr ""
+"Swift-all-in-one Docker images are now built and published to https://hub."
+"docker.com/r/openstackswift/saio. These are intended for use as development "
+"targets, but will hopefully be useful as a starting point for other work "
+"involving containerizing Swift."
+
+msgid ""
+"Symlink objects reference one other object. They are created by creating an "
+"empty object with an X-Symlink-Target header. The value of the header is of "
+"the format /, and the target does not need to exist at "
+"the time of symlink creation. Cross-account symlinks can be created by "
+"including the X-Symlink-Target-Account header."
+msgstr ""
+"Symlink objects reference one other object. They are created by creating an "
+"empty object with an X-Symlink-Target header. The value of the header is of "
+"the format /, and the target does not need to exist at "
+"the time of symlink creation. Cross-account symlinks can be created by "
+"including the X-Symlink-Target-Account header."
+
+msgid ""
+"TempURLs now support IP range restrictions. Please see https://docs."
+"openstack.org/swift/latest/middleware.html#client-usage for more information "
+"on how to use this additional restriction."
+msgstr ""
+"TempURLs now support IP range restrictions. Please see https://docs."
+"openstack.org/swift/latest/middleware.html#client-usage for more information "
+"on how to use this additional restriction."
+
+msgid ""
+"TempURLs now support a validation against a common prefix. A prefix-based "
+"signature grants access to all objects which share the same prefix. This "
+"avoids the creation of a large amount of signatures, when a whole container "
+"or pseudofolder is shared."
+msgstr ""
+"TempURLs now support a validation against a common prefix. A prefix-based "
+"signature grants access to all objects which share the same prefix. This "
+"avoids the creation of a large amount of signatures, when a whole container "
+"or pseudofolder is shared."
+
+msgid ""
+"TempURLs using the \"inline\" parameter can now also set the \"filename\" "
+"parameter. Both are used in the Content-Disposition response header."
+msgstr ""
+"TempURLs using the \"inline\" parameter can now also set the \"filename\" "
+"parameter. Both are used in the Content-Disposition response header."
+
+msgid ""
+"Temporary URLs now support one common form of ISO 8601 timestamps in "
+"addition to Unix seconds-since-epoch timestamps. The ISO 8601 format "
+"accepted is '%Y-%m-%dT%H:%M:%SZ'. This makes TempURLs more user-friendly to "
+"produce and consume."
+msgstr ""
+"Temporary URLs now support one common form of ISO 8601 timestamps in "
+"addition to Unix seconds-since-epoch timestamps. The ISO 8601 format "
+"accepted is '%Y-%m-%dT%H:%M:%SZ'. This makes TempURLs more user-friendly to "
+"produce and consume."
+
+msgid ""
+"The 'compact' command now outputs the total number of compactible sequences."
+msgstr ""
+"The 'compact' command now outputs the total number of compactible sequences."
+
+msgid ""
+"The EC reconstructor process has been dramatically improved by adding "
+"support for multiple concurrent workers. Multiple processes are required to "
+"get high concurrency, and this change results in much faster rebalance times "
+"on servers with many drives."
+msgstr ""
+"The EC reconstructor process has been dramatically improved by adding "
+"support for multiple concurrent workers. Multiple processes are required to "
+"get high concurrency, and this change results in much faster rebalance times "
+"on servers with many drives."
+
+msgid ""
+"The EC reconstructor will now attempt to remove empty directories "
+"immediately, while the inodes are still cached, rather than waiting until "
+"the next run."
+msgstr ""
+"The EC reconstructor will now attempt to remove empty directories "
+"immediately, while the inodes are still cached, rather than waiting until "
+"the next run."
+
+msgid "The ETag-quoting middleware no longer raises TypeErrors."
+msgstr "The ETag-quoting middleware no longer raises TypeErrors."
+
+msgid "The S3 ACL and Delete Multiple APIs are now less case-sensitive."
+msgstr "The S3 ACL and Delete Multiple APIs are now less case-sensitive."
+
+msgid ""
+"The ``container-replicator`` now correctly enqueues ``container-reconciler`` "
+"work for sharded containers."
+msgstr ""
+"The ``container-replicator`` now correctly enqueues ``container-reconciler`` "
+"work for sharded containers."
+
+msgid ""
+"The ``container-replicator`` now only attempts to fetch shard ranges if the "
+"remote indicates that it has shard ranges. Further, it does so with a "
+"timeout to prevent the process from hanging in certain cases."
+msgstr ""
+"The ``container-replicator`` now only attempts to fetch shard ranges if the "
+"remote indicates that it has shard ranges. Further, it does so with a "
+"timeout to prevent the process from hanging in certain cases."
+
+msgid ""
+"The ``domain_remap`` middleware now supports the ``mangle_client_paths`` "
+"option. Its default \"false\" value changes ``domain_remap`` parsing to stop "
+"stripping the ``path_root`` value from URL paths. If users depend on this "
+"path mangling, operators should set ``mangle_client_paths`` to \"True\" "
+"before upgrading."
+msgstr ""
+"The ``domain_remap`` middleware now supports the ``mangle_client_paths`` "
+"option. Its default \"false\" value changes ``domain_remap`` parsing to stop "
+"stripping the ``path_root`` value from URL paths. If users depend on this "
+"path mangling, operators should set ``mangle_client_paths`` to \"True\" "
+"before upgrading."
+
+msgid ""
+"The ``kmip_keymaster`` middleware can now be configured directly in the "
+"proxy-server config file. The existing behavior of using an external config "
+"file is still supported."
+msgstr ""
+"The ``kmip_keymaster`` middleware can now be configured directly in the "
+"proxy-server config file. The existing behaviour of using an external config "
+"file is still supported."
+
+msgid ""
+"The ``object-expirer`` may now be configured in ``object-server.conf``. This "
+"is in anticipation of a future change to allow the ``object-expirer`` to be "
+"deployed on all nodes that run the ``object-server``."
+msgstr ""
+"The ``object-expirer`` may now be configured in ``object-server.conf``. This "
+"is in anticipation of a future change to allow the ``object-expirer`` to be "
+"deployed on all nodes that run the ``object-server``."
+
+msgid ""
+"The ``proxy-server`` now caches 'updating' shards, improving write "
+"performance for sharded containers. A new config option, "
+"``recheck_updating_shard_ranges``, controls the cache time; set it to 0 to "
+"disable caching."
+msgstr ""
+"The ``proxy-server`` now caches 'updating' shards, improving write "
+"performance for sharded containers. A new config option, "
+"``recheck_updating_shard_ranges``, controls the cache time; set it to 0 to "
+"disable caching."
+
+msgid ""
+"The ``proxy-server`` now ignores 404 responses from handoffs that have no "
+"data when deciding on the correct response for object requests, similar to "
+"what it already does for account and container requests."
+msgstr ""
+"The ``proxy-server`` now ignores 404 responses from handoffs that have no "
+"data when deciding on the correct response for object requests, similar to "
+"what it already does for account and container requests."
+
+msgid ""
+"The ``proxy-server`` now ignores 404 responses from handoffs without "
+"databases when deciding on the correct response for account and container "
+"requests."
+msgstr ""
+"The ``proxy-server`` now ignores 404 responses from handoffs without "
+"databases when deciding on the correct response for account and container "
+"requests."
+
+msgid ""
+"The ``recoverable_node_timeout`` option no longer applies to ``X-Newest`` "
+"GET requests."
+msgstr ""
+"The ``recoverable_node_timeout`` option no longer applies to ``X-Newest`` "
+"GET requests."
+
+msgid ""
+"The ``swift-drive-audit`` tool now works with ISO timestamps in kernel logs."
+msgstr ""
+"The ``swift-drive-audit`` tool now works with ISO timestamps in kernel logs."
+
+msgid ""
+"The ``swift-manage-shard-ranges`` tool has a new mode to repair gaps in the "
+"namespace."
+msgstr ""
+"The ``swift-manage-shard-ranges`` tool has a new mode to repair gaps in the "
+"namespace."
+
+msgid "The ``swift-recon-cron`` tool now better handles missing directories."
+msgstr "The ``swift-recon-cron`` tool now better handles missing directories."
+
+msgid ""
+"The above bug was caused by a difference in string types that resulted in "
+"ambiguity when decrypting. To prevent the ambiguity for new data, set "
+"``meta_version_to_write = 3`` in your keymaster configuration *after* "
+"upgrading all proxy servers."
+msgstr ""
+"The above bug was caused by a difference in string types that resulted in "
+"ambiguity when decrypting. To prevent the ambiguity for new data, set "
+"``meta_version_to_write = 3`` in your keymaster configuration *after* "
+"upgrading all proxy servers."
+
+msgid ""
+"The account and container auditors now log and update recon before going to "
+"sleep."
+msgstr ""
+"The account and container auditors now log and update recon before going to "
+"sleep."
+
+msgid ""
+"The bulk extract middleware once again allows clients to specify metadata "
+"(including expiration timestamps) for all objects in the archive."
+msgstr ""
+"The bulk extract middleware once again allows clients to specify metadata "
+"(including expiration timestamps) for all objects in the archive."
+
+msgid ""
+"The concurrent read options (``concurrent_gets``, ``concurrency_timeout``, "
+"and ``concurrent_ec_extra_requests``) may now be configured per storage-"
+"policy."
+msgstr ""
+"The concurrent read options (``concurrent_gets``, ``concurrency_timeout``, "
+"and ``concurrent_ec_extra_requests``) may now be configured per storage-"
+"policy."
+
+msgid ""
+"The container sharder can now handle containers with special characters in "
+"their names."
+msgstr ""
+"The container sharder can now handle containers with special characters in "
+"their names."
+
+msgid ""
+"The container-reconciler now scales out better with new ``processes``, "
+"``process``, and ``concurrency`` options, similar to the object-expirer."
+msgstr ""
+"The container-reconciler now scales out better with new ``processes``, "
+"``process``, and ``concurrency`` options, similar to the object-expirer."
+
+msgid ""
+"The container-updater now reports zero objects and bytes used for child DBs "
+"in sharded containers. This prevents double-counting in utilization reports."
+msgstr ""
+"The container-updater now reports zero objects and bytes used for child DBs "
+"in sharded containers. This prevents double-counting in utilisation reports."
+
+msgid "The correct storage policy is now logged for S3 requests."
+msgstr "The correct storage policy is now logged for S3 requests."
+
+msgid ""
+"The dark-data audit watcher now requires that all primary locations for an "
+"object's container agree that the data does not appear in listings to "
+"consider data \"dark\". Previously, a network partition that left an object "
+"node isolated could cause it to quarantine or delete all of its data."
+msgstr ""
+"The dark-data audit watcher now requires that all primary locations for an "
+"object's container agree that the data does not appear in listings to "
+"consider data \"dark\". Previously, a network partition that left an object "
+"node isolated could cause it to quarantine or delete all of its data."
+
+msgid ""
+"The dark-data audit watcher now skips objects younger than a new "
+"configurable ``grace_age`` period. This avoids issues where data could be "
+"flagged, quarantined, or deleted because of listing consistency issues. The "
+"default is one week."
+msgstr ""
+"The dark-data audit watcher now skips objects younger than a new "
+"configurable ``grace_age`` period. This avoids issues where data could be "
+"flagged, quarantined, or deleted because of listing consistency issues. The "
+"default is one week."
+
+msgid ""
+"The dark-data object audit watcher now works with sharded containers. "
+"Previously, it would think that all data files were absent from listings."
+msgstr ""
+"The dark-data object audit watcher now works with sharded containers. "
+"Previously, it would think that all data files were absent from listings."
+
+msgid ""
+"The default for `object_post_as_copy` has been changed to False. The option "
+"is now deprecated and will be removed in a future release. If your cluster "
+"is still running with post-as-copy enabled, please update it to use the "
+"\"fast-post\" method. Future versions of Swift will not support post-as-"
+"copy, and future features will not be supported under post-as-copy. (\"Fast-"
+"post\" is where `object_post_as_copy` is false)."
+msgstr ""
+"The default for `object_post_as_copy` has been changed to False. The option "
+"is now deprecated and will be removed in a future release. If your cluster "
+"is still running with post-as-copy enabled, please update it to use the "
+"\"fast-post\" method. Future versions of Swift will not support post-as-"
+"copy, and future features will not be supported under post-as-copy. (\"Fast-"
+"post\" is where `object_post_as_copy` is false)."
+
+msgid ""
+"The default location is now set to \"us-east-1\". This is more likely to be "
+"the default region that a client will try when using v4 signatures."
+msgstr ""
+"The default location is now set to \"us-east-1\". This is more likely to be "
+"the default region that a client will try when using v4 signatures."
+
+msgid ""
+"The erasure code reconstructor `handoffs_first` option has been deprecated "
+"in favor of `handoffs_only`. `handoffs_only` is far more useful, and just "
+"like `handoffs_first` mode in the replicator, it gives the operator the "
+"option of forcing the consistency engine to focus solely on revert (handoff) "
+"jobs, thus improving the speed of rebalances.  The `handoffs_only` behavior "
+"is somewhat consistent with the replicator's `handoffs_first` option (any "
+"error on any handoff in the replicator will make it essentially handoff only "
+"forever) but the `handoff_only` option does what you want and is named "
+"correctly in the reconstructor."
+msgstr ""
+"The erasure code reconstructor `handoffs_first` option has been deprecated "
+"in favour of `handoffs_only`. `handoffs_only` is far more useful, and just "
+"like `handoffs_first` mode in the replicator, it gives the operator the "
+"option of forcing the consistency engine to focus solely on revert (handoff) "
+"jobs, thus improving the speed of rebalances.  The `handoffs_only` behaviour "
+"is somewhat consistent with the replicator's `handoffs_first` option (any "
+"error on any hand-off in the replicator will make it essentially hand-off "
+"only forever) but the `handoff_only` option does what you want and is named "
+"correctly in the reconstructor."
+
+msgid ""
+"The erasure code reconstructor will now shuffle work jobs across all disks "
+"instead of going disk-by-disk. This eliminates single-disk I/O contention "
+"and allows continued scaling as concurrency is increased."
+msgstr ""
+"The erasure code reconstructor will now shuffle work jobs across all disks "
+"instead of going disk-by-disk. This eliminates single-disk I/O contention "
+"and allows continued scaling as concurrency is increased."
+
+msgid ""
+"The formpost digest algorithm is now configurable via the new "
+"``allowed_digests`` option, and support is added for both SHA-256 and "
+"SHA-512. Supported formpost digests are exposed to clients in ``/info``. "
+"Additionally, formpost signatures can now be base64 encoded."
+msgstr ""
+"The formpost digest algorithm is now configurable via the new "
+"``allowed_digests`` option, and support is added for both SHA-256 and "
+"SHA-512. Supported formpost digests are exposed to clients in ``/info``. "
+"Additionally, formpost signatures can now be base64 encoded."
+
+msgid ""
+"The formpost middleware now properly supports uploading multiple files with "
+"different content-types."
+msgstr ""
+"The formpost middleware now properly supports uploading multiple files with "
+"different content-types."
+
+msgid "The formpost middleware now works with unicode file names."
+msgstr "The formpost middleware now works with Unicode file names."
+
+msgid ""
+"The improvements to EC reads made in Swift 2.10.0 have also been applied to "
+"the reconstructor. This allows fragments to be rebuilt in more "
+"circumstances, resulting in faster recovery from failures."
+msgstr ""
+"The improvements to EC reads made in Swift 2.10.0 have also been applied to "
+"the reconstructor. This allows fragments to be rebuilt in more "
+"circumstances, resulting in faster recovery from failures."
+
+msgid ""
+"The message template for proxy logging may now include a ``{domain}`` field "
+"for the client-provided ``Host`` header."
+msgstr ""
+"The message template for proxy logging may now include a ``{domain}`` field "
+"for the client-provided ``Host`` header."
+
+msgid ""
+"The more-efficient shard range structure from the last release is now used "
+"when fetching ranges from the backend."
+msgstr ""
+"The more-efficient shard range structure from the last release is now used "
+"when fetching ranges from the backend."
+
+msgid ""
+"The number of container updates on object PUTs (ie to update listings) has "
+"been recomputed to be far more efficient  while maintaining durability "
+"guarantees. Specifically, object PUTs to erasure-coded policies will now "
+"normally result in far fewer container updates."
+msgstr ""
+"The number of container updates on object PUTs (ie to update listings) has "
+"been recomputed to be far more efficient  while maintaining durability "
+"guarantees. Specifically, object PUTs to erasure-coded policies will now "
+"normally result in far fewer container updates."
+
+msgid ""
+"The object and container server config option ``slowdown`` has been "
+"deprecated in favor of the new ``objects_per_second`` and "
+"``containers_per_second`` options."
+msgstr ""
+"The object and container server config option ``slowdown`` has been "
+"deprecated in favour of the new ``objects_per_second`` and "
+"``containers_per_second`` options."
+
+msgid ""
+"The object reconstructor can now rebuild an EC fragment for an expired "
+"object."
+msgstr ""
+"The object reconstructor can now rebuild an EC fragment for an expired "
+"object."
+
+msgid ""
+"The object reconstructor will now fork all available worker processes when "
+"operating on a subset of local devices."
+msgstr ""
+"The object reconstructor will now fork all available worker processes when "
+"operating on a subset of local devices."
+
+msgid ""
+"The object server runs certain IO-intensive methods outside the main pthread "
+"for performance. Previously, if one of those methods tried to log, this can "
+"cause a crash that eventually leads to an object server with hundreds or "
+"thousands of greenthreads, all deadlocked. The fix is to use a mutex that "
+"works across different greenlets and different pthreads."
+msgstr ""
+"The object server runs certain IO-intensive methods outside the main pthread "
+"for performance. Previously, if one of those methods tried to log, this can "
+"cause a crash that eventually leads to an object server with hundreds or "
+"thousands of greenthreads, all deadlocked. The fix is to use a mutex that "
+"works across different greenlets and different pthreads."
+
+msgid ""
+"The object updater now supports two configuration settings: \"concurrency\" "
+"and \"updater_workers\". The latter controls how many worker processes are "
+"spawned, while the former controls how many concurrent container updates are "
+"performed by each worker process. This should speed the processing of "
+"async_pendings."
+msgstr ""
+"The object updater now supports two configuration settings: \"concurrency\" "
+"and \"updater_workers\". The latter controls how many worker processes are "
+"spawned, while the former controls how many concurrent container updates are "
+"performed by each worker process. This should speed the processing of "
+"async_pendings."
+
+msgid "The object-expirer logs fewer client disconnects."
+msgstr "The object-expirer logs fewer client disconnects."
+
+msgid ""
+"The object-expirer now only cleans up empty containers. Previously, it would "
+"attempt to delete all processed containers, regardless of whether there were "
+"entries which were skipped or had errors."
+msgstr ""
+"The object-expirer now only cleans up empty containers. Previously, it would "
+"attempt to delete all processed containers, regardless of whether there were "
+"entries which were skipped or had errors."
+
+msgid ""
+"The object-replicator now logs successful rsync transfers at debug instead "
+"of info."
+msgstr ""
+"The object-replicator now logs successful rsync transfers at debug instead "
+"of info."
+
+msgid ""
+"The object-updater now defers rate-limited updates to the end of its cycle; "
+"these deferred updates will be processed (at the limited rate) until the "
+"configured ``interval`` elapses. A new ``max_deferred_updates`` option may "
+"be used to bound the deferral queue."
+msgstr ""
+"The object-updater now defers rate-limited updates to the end of its cycle; "
+"these deferred updates will be processed (at the limited rate) until the "
+"configured ``interval`` elapses. A new ``max_deferred_updates`` option may "
+"be used to bound the deferral queue."
+
+msgid ""
+"The output of devices from ``swift-ring-builder`` has been reordered by "
+"region, zone, ip, and device."
+msgstr ""
+"The output of devices from ``swift-ring-builder`` has been reordered by "
+"region, zone, ip, and device."
+
+msgid ""
+"The post-rsync REPLICATE call no longer recalculates hashes immediately."
+msgstr ""
+"The post-rsync REPLICATE call no longer recalculates hashes immediately."
+
+msgid ""
+"The proxy server now applies error-limiting to the correct node when "
+"handling a recoverable node error."
+msgstr ""
+"The proxy server now applies error-limiting to the correct node when "
+"handling a recoverable node error."
+
+msgid ""
+"The proxy-server now caches 'listing' shards, improving listing performance "
+"for sharded containers. A new config option, "
+"``recheck_listing_shard_ranges``, controls the cache time and defaults to 10 "
+"minutes; set it to 0 to disable caching (the previous behavior)."
+msgstr ""
+"The proxy-server now caches 'listing' shards, improving listing performance "
+"for sharded containers. A new config option, "
+"``recheck_listing_shard_ranges``, controls the cache time and defaults to 10 "
+"minutes; set it to 0 to disable caching (the previous behaviour)."
+
+msgid ""
+"The reconciler now defers working on policies that have a partition power "
+"increase in progress to avoid issues with concurrent writes."
+msgstr ""
+"The reconciler now defers working on policies that have a partition power "
+"increase in progress to avoid issues with concurrent writes."
+
+msgid ""
+"The relinker better handles data found from earlier partition power "
+"increases."
+msgstr ""
+"The relinker better handles data found from earlier partition power "
+"increases."
+
+msgid ""
+"The relinker better handles tombstones found for the same object but with "
+"different inodes."
+msgstr ""
+"The relinker better handles tombstones found for the same object but with "
+"different inodes."
+
+msgid ""
+"The relinker can now target specific storage policies or partitions by using "
+"the new ``--policy`` and ``--partition`` options."
+msgstr ""
+"The relinker can now target specific storage policies or partitions by using "
+"the new ``--policy`` and ``--partition`` options."
+
+msgid ""
+"The relinker now performs eventlet-hub selection the same way as other "
+"daemons. In particular, ``epolls`` will no longer be selected, as it seemed "
+"to cause occassional hangs."
+msgstr ""
+"The relinker now performs eventlet-hub selection the same way as other "
+"daemons. In particular, ``epolls`` will no longer be selected, as it seemed "
+"to cause occasional hangs."
+
+msgid ""
+"The relinker now spawns multiple subprocesses to process disks in parallel. "
+"By default, one worker is spawned per disk; use the new ``--workers`` option "
+"to control how many subprocesses are used. Use ``--workers=0`` to maintain "
+"the previous behavior."
+msgstr ""
+"The relinker now spawns multiple subprocesses to process disks in parallel. "
+"By default, one worker is spawned per disk; use the new ``--workers`` option "
+"to control how many subprocesses are used. Use ``--workers=0`` to maintain "
+"the previous behaviour."
+
+msgid ""
+"The sharder and swift-manage-shard-ranges now consider total row count "
+"(instead of just object count) when deciding whether a shard is a candidate "
+"for shrinking."
+msgstr ""
+"The sharder and swift-manage-shard-ranges now consider total row count "
+"(instead of just object count) when deciding whether a shard is a candidate "
+"for shrinking."
+
+msgid ""
+"The sharder daemon has been enhanced to better support the shrinking of "
+"shards that are no longer required. Shard containers will now discover from "
+"their root container if they should be shrinking. They will also discover "
+"the shards into which they should shrink, which may include the root "
+"container itself."
+msgstr ""
+"The sharder daemon has been enhanced to better support the shrinking of "
+"shards that are no longer required. Shard containers will now discover from "
+"their root container if they should be shrinking. They will also discover "
+"the shards into which they should shrink, which may include the root "
+"container itself."
+
+msgid ""
+"The sharder now correctly identifies and fails audits for shard ranges that "
+"overlap exactly."
+msgstr ""
+"The sharder now correctly identifies and fails audits for shard ranges that "
+"overlap exactly."
+
+msgid ""
+"The sharding progress reports in recon cache now continue to be included for "
+"a period of time after sharding has completed. The time period may be "
+"configured using the ``recon_sharded_timeout`` option in the ``[container-"
+"sharder]`` section of container-server.conf, and defaults to 12 hours."
+msgstr ""
+"The sharding progress reports in recon cache now continue to be included for "
+"a period of time after sharding has completed. The time period may be "
+"configured using the ``recon_sharded_timeout`` option in the ``[container-"
+"sharder]`` section of container-server.conf, and defaults to 12 hours."
+
+msgid ""
+"The standard-library ``logging`` module is no longer monkey-patched when "
+"importing ``swift.common.utils``, making it easier to re-use swift code in "
+"other contexts."
+msgstr ""
+"The standard-library ``logging`` module is no longer monkey-patched when "
+"importing ``swift.common.utils``, making it easier to re-use Swift code in "
+"other contexts."
+
+msgid ""
+"The staticweb middleware now allows empty listings at the root of a "
+"container. Previously, this would result in a 404 response."
+msgstr ""
+"The staticweb middleware now allows empty listings at the root of a "
+"container. Previously, this would result in a 404 response."
+
+msgid ""
+"The structure of cached shard ranges has changed, improving performance when "
+"listing or writing to sharded containers. Note that immediately after "
+"upgrade, the new structures will all be cache misses, which may lead to a "
+"thundering herd problem. To avoid this, upgrade just a few nodes first, let "
+"them service some fraction of traffic to populate the cache, then upgrade "
+"the rest of the cluster."
+msgstr ""
+"The structure of cached shard ranges has changed, improving performance when "
+"listing or writing to sharded containers. Note that immediately after "
+"upgrade, the new structures will all be cache misses, which may lead to a "
+"thundering herd problem. To avoid this, upgrade just a few nodes first, let "
+"them service some fraction of traffic to populate the cache, then upgrade "
+"the rest of the cluster."
+
+msgid ""
+"The tempurl digest algorithm is now configurable, and Swift added support "
+"for both SHA-256 and SHA-512. Supported tempurl digests are exposed to "
+"clients in ``/info``. Additionally, tempurl signatures can now be base64 "
+"encoded."
+msgstr ""
+"The tempurl digest algorithm is now configurable, and Swift added support "
+"for both SHA-256 and SHA-512. Supported tempurl digests are exposed to "
+"clients in ``/info``. Additionally, tempurl signatures can now be base64 "
+"encoded."
+
+msgid ""
+"The tempurl middleware has been updated to return a 503 if storing a token "
+"in memcache fails. Third party authentication middlewares are encouraged to "
+"also use the new ``raise_on_error`` keyword argument when storing ephemeral "
+"tokens in memcache."
+msgstr ""
+"The tempurl middleware has been updated to return a 503 if storing a token "
+"in memcache fails. Third party authentication middlewares are encouraged to "
+"also use the new ``raise_on_error`` keyword argument when storing ephemeral "
+"tokens in memcache."
+
+msgid "This is the final stable branch that will support Python 2.7."
+msgstr "This is the final stable branch that will support Python 2.7."
+
+msgid ""
+"Throttle update_auditor_status calls so it updates no more than once per "
+"minute."
+msgstr ""
+"Throttle update_auditor_status calls so it updates no more than once per "
+"minute."
+
+msgid ""
+"Throttle update_auditor_status calls so it updates no more than once per "
+"minute. This prevents excessive IO on a new cluster."
+msgstr ""
+"Throttle update_auditor_status calls so it updates no more than once per "
+"minute. This prevents excessive IO on a new cluster."
+
+msgid "Train Series Release Notes"
+msgstr "Train Series Release Notes"
+
+msgid "Transaction IDs are included in more error responses."
+msgstr "Transaction IDs are included in more error responses."
+
+msgid ""
+"Transaction IDs are now only included in daemon log lines in a request/"
+"response context."
+msgstr ""
+"Transaction IDs are now only included in daemon log lines in a request/"
+"response context."
+
+msgid "Truncate error logs to prevent log handler from running out of buffer."
+msgstr "Truncate error logs to prevent log handler from running out of buffer."
+
+msgid ""
+"Turned off thread-logging when monkey-patching with eventlet. This addresses "
+"a potential hang in the proxy-server while logging client disconnects."
+msgstr ""
+"Turned off thread-logging when monkey-patching with eventlet. This addresses "
+"a potential hang in the proxy-server while logging client disconnects."
+
+msgid ""
+"Ubuntu 18.04 and RDO's CentOS 7 repos package liberasurecode 1.5.0, while "
+"Ubuntu 20.04 and RDO's CentOS 8 repos currently package liberasurecode 1.6.0 "
+"or 1.6.1. Take care when upgrading major distro versions!"
+msgstr ""
+"Ubuntu 18.04 and RDO's CentOS 7 repos package liberasurecode 1.5.0, while "
+"Ubuntu 20.04 and RDO's CentOS 8 repos currently package liberasurecode 1.6.0 "
+"or 1.6.1. Take care when upgrading major distro versions!"
+
+msgid "Unsigned payloads work with v4 signatures once more."
+msgstr "Unsigned payloads work with v4 signatures once more."
+
+msgid ""
+"Update dnspython dependency to 1.14, removing the need to have separate "
+"dnspython dependencies for Py2 and Py3."
+msgstr ""
+"Update dnspython dependency to 1.14, removing the need to have separate "
+"dnspython dependencies for Py2 and Py3."
+
+msgid "Updated docs to reference appropriate ports."
+msgstr "Updated docs to reference appropriate ports."
+
+msgid "Updated requirements.txt to match global exclusions and formatting."
+msgstr "Updated requirements.txt to match global exclusions and formatting."
+
+msgid "Updated the PyECLib dependency to 1.3.1."
+msgstr "Updated the PyECLib dependency to 1.3.1."
+
+msgid ""
+"Updated the `hashes.pkl` file format to include timestamp information for "
+"race detection. Also simplified hashing logic to prevent race conditions and "
+"optimize for the common case."
+msgstr ""
+"Updated the `hashes.pkl` file format to include timestamp information for "
+"race detection. Also simplified hashing logic to prevent race conditions and "
+"optimise for the common case."
+
+msgid ""
+"Upgrade Impact: If you upgrade and roll back, you must delete all `hashes."
+"pkl` files."
+msgstr ""
+"Upgrade Impact: If you upgrade and roll back, you must delete all `hashes."
+"pkl` files."
+
+msgid "Upgrade Notes"
+msgstr "Upgrade Notes"
+
+msgid ""
+"Upgrade impact -- during a rolling upgrade, an updated proxy server may "
+"write a manifest that an out-of-date proxy server will not be able to read. "
+"This will resolve itself once the upgrade completes on all nodes."
+msgstr ""
+"Upgrade impact -- during a rolling upgrade, an updated proxy server may "
+"write a manifest that an out-of-date proxy server will not be able to read. "
+"This will resolve itself once the upgrade completes on all nodes."
+
+msgid ""
+"Upgrade liberasurecode on all object servers. Object servers can now read "
+"both old and new fragments."
+msgstr ""
+"Upgrade liberasurecode on all object servers. Object servers can now read "
+"both old and new fragments."
+
+msgid ""
+"Upgrade liberasurecode on all proxy servers. Newly-written data will now use "
+"new fragments. Note that not-yet-upgraded proxies will not be able to read "
+"these newly-written fragments but will instead respond ``500 Internal Server "
+"Error``."
+msgstr ""
+"Upgrade liberasurecode on all proxy servers. Newly-written data will now use "
+"new fragments. Note that not-yet-upgraded proxies will not be able to read "
+"these newly-written fragments but will instead respond ``500 Internal Server "
+"Error``."
+
+msgid ""
+"User metadata is now exposed via CORS when encryption is enabled, matching "
+"the behavior when encryption is not enabled."
+msgstr ""
+"User metadata is now exposed via CORS when encryption is enabled, matching "
+"the behaviour when encryption is not enabled."
+
+msgid "Ussuri Series Release Notes"
+msgstr "Ussuri Series Release Notes"
+
+msgid "Various logging and metrics improvements when talking to memcache."
+msgstr "Various logging and metrics improvements when talking to memcache."
+
+msgid "Various other minor bug fixes and improvements."
+msgstr "Various other minor bug fixes and improvements."
+
+msgid "Various other minor bug fixes."
+msgstr "Various other minor bug fixes."
+
+msgid "Victoria Series Release Notes"
+msgstr "Victoria Series Release Notes"
+
+msgid ""
+"WARNING: If you are using the ISA-L library for erasure codes, please "
+"upgrade to liberasurecode 1.3.1 (or later) as soon as possible. If you are "
+"using isa_l_rs_vand with more than 4 parity, please read https://bugs."
+"launchpad.net/swift/+bug/1639691 and take necessary action."
+msgstr ""
+"WARNING: If you are using the ISA-L library for erasure codes, please "
+"upgrade to liberasurecode 1.3.1 (or later) as soon as possible. If you are "
+"using isa_l_rs_vand with more than 4 parity, please read https://bugs."
+"launchpad.net/swift/+bug/1639691 and take necessary action."
+
+msgid "WSGI server processes can now notify systemd when they are ready."
+msgstr "WSGI server processes can now notify systemd when they are ready."
+
+msgid "Wallaby Series Release Notes"
+msgstr "Wallaby Series Release Notes"
+
+msgid "Warn when relinking/cleaning up and any disks are unmounted."
+msgstr "Warn when relinking/cleaning up and any disks are unmounted."
+
+msgid ""
+"We do not yet have CLI tools for creating composite rings, but the "
+"functionality has been enabled in the ring modules to support this advanced "
+"functionality. CLI tools will be delivered in a subsequent release."
+msgstr ""
+"We do not yet have CLI tools for creating composite rings, but the "
+"functionality has been enabled in the ring modules to support this advanced "
+"functionality. CLI tools will be delivered in a subsequent release."
+
+msgid ""
+"When building a listing from shards, any failure to retrieve listings will "
+"result in a 503 response. Previously, failures fetching a partiucular shard "
+"would result in a gap in listings."
+msgstr ""
+"When building a listing from shards, any failure to retrieve listings will "
+"result in a 503 response. Previously, failures fetching a particular shard "
+"would result in a gap in listings."
+
+msgid ""
+"When listing objects in a container in json format, static large objects "
+"(SLOs) will now include an additional new \"slo_etag\" key that matches the "
+"etag returned when requesting the SLO. The existing \"hash\" key remains "
+"unchanged as the MD5 of the SLO manifest. Text and XML listings are "
+"unaffected by this change."
+msgstr ""
+"When listing objects in a container in json format, static large objects "
+"(SLOs) will now include an additional new \"slo_etag\" key that matches the "
+"etag returned when requesting the SLO. The existing \"hash\" key remains "
+"unchanged as the MD5 of the SLO manifest. Text and XML listings are "
+"unaffected by this change."
+
+msgid ""
+"When looking for the active root secret, only the right-most keymaster is "
+"used."
+msgstr ""
+"When looking for the active root secret, only the right-most keymaster is "
+"used."
+
+msgid ""
+"When making backend requests, the ``proxy-server`` now ensures query "
+"parameters are always properly quoted. Previously, the proxy would encounter "
+"an error on Python 2.7.17 if the client included non-ASCII query parameters "
+"in object requests. This was previously fixed in 2.23.0."
+msgstr ""
+"When making backend requests, the ``proxy-server`` now ensures query "
+"parameters are always properly quoted. Previously, the proxy would encounter "
+"an error on Python 2.7.17 if the client included non-ASCII query parameters "
+"in object requests. This was previously fixed in 2.23.0."
+
+msgid ""
+"When object path is not a directory, just quarantine it, rather than the "
+"whole suffix."
+msgstr ""
+"When object path is not a directory, just quarantine it, rather than the "
+"whole suffix."
+
+msgid ""
+"When refetching Static Large Object manifests, non-manifest responses are "
+"now handled better."
+msgstr ""
+"When refetching Static Large Object manifests, non-manifest responses are "
+"now handled better."
+
+msgid ""
+"When requesting objects, return 404 if a tombstone is found and is newer "
+"than any data found. Previous behavior was to return stale data."
+msgstr ""
+"When requesting objects, return 404 if a tombstone is found and is newer "
+"than any data found. Previous behaviour was to return stale data."
+
+msgid ""
+"When running with ``s3_acl`` disabled, ``bucket-owner-full-control`` and "
+"``bucket-owner-read`` canned ACLs will be translated to the same Swift ACLs "
+"as ``private``."
+msgstr ""
+"When running with ``s3_acl`` disabled, ``bucket-owner-full-control`` and "
+"``bucket-owner-read`` canned ACLs will be translated to the same Swift ACLs "
+"as ``private``."
+
+msgid ""
+"When the object auditor examines an object, it will now add any missing "
+"metadata checksums."
+msgstr ""
+"When the object auditor examines an object, it will now add any missing "
+"metadata checksums."
+
+msgid ""
+"With heartbeating turned on, the proxy will start its response immediately "
+"with 202 Accepted then send a single whitespace character periodically until "
+"the request completes. At that point, a final summary chunk will be sent "
+"which includes a \"Response Status\" key indicating success or failure and "
+"(if successful) an \"Etag\" key indicating the Etag of the resulting SLO."
+msgstr ""
+"With heartbeating turned on, the proxy will start its response immediately "
+"with 202 Accepted then send a single whitespace character periodically until "
+"the request completes. At that point, a final summary chunk will be sent "
+"which includes a \"Response Status\" key indicating success or failure and "
+"(if successful) an \"Etag\" key indicating the Etag of the resulting SLO."
+
+msgid ""
+"Worker process logs will have a bit of information prepended so operators "
+"can tell which messages came from which worker. The prefix is \"[worker M/N "
+"pid=P] \", where M is the worker's index, N is the total number of workers, "
+"and P is the process ID. Every message from the replicator's logger will "
+"have the prefix"
+msgstr ""
+"Worker process logs will have a bit of information prepended so operators "
+"can tell which messages came from which worker. The prefix is \"[worker M/N "
+"pid=P] \", where M is the worker's index, N is the total number of workers, "
+"and P is the process ID. Every message from the replicator's logger will "
+"have the prefix"
+
+msgid "Write-affinity aware object deletion"
+msgstr "Write-affinity aware object deletion"
+
+msgid ""
+"X-Delete-At computation now uses X-Timestamp instead of system time. This "
+"prevents clock skew causing inconsistent expiry data."
+msgstr ""
+"X-Delete-At computation now uses X-Timestamp instead of system time. This "
+"prevents clock skew causing inconsistent expiry data."
+
+msgid "Xena Series Release Notes"
+msgstr "Xena Series Release Notes"
+
+msgid "Yoga Series Release Notes"
+msgstr "Yoga Series Release Notes"
+
+msgid "Zed Series Release Notes"
+msgstr "Zed Series Release Notes"
+
+msgid "``Content-Type`` can now be updated when copying an object."
+msgstr "``Content-Type`` can now be updated when copying an object."
+
+msgid ""
+"``EIO`` errors during read now cause object diskfiles to be quarantined."
+msgstr ""
+"``EIO`` errors during read now cause object diskfiles to be quarantined."
+
+msgid ""
+"``ENOENT`` and ``ENODATA`` errors are better handled in the object "
+"replicator and auditor."
+msgstr ""
+"``ENOENT`` and ``ENODATA`` errors are better handled in the object "
+"replicator and auditor."
+
+msgid "``EPIPE`` errors no longer log tracebacks."
+msgstr "``EPIPE`` errors no longer log tracebacks."
+
+msgid ""
+"``LastModified`` timestamps in listings are now rounded up to whole seconds, "
+"like they are in responses from AWS."
+msgstr ""
+"``LastModified`` timestamps in listings are now rounded up to whole seconds "
+"like they are in responses from AWS."
+
+msgid "``fallocate_reserve`` may be specified as a percentage in more places."
+msgstr "``fallocate_reserve`` may be specified as a percentage in more places."
+
+msgid ""
+"``s3token`` no longer mangles request paths that include the Access Key ID."
+msgstr ""
+"``s3token`` no longer mangles request paths that include the Access Key ID."
+
+msgid "``swift-account-audit``"
+msgstr "``swift-account-audit``"
+
+msgid ""
+"``swift-account-info`` and ``swift-container-info`` now accept a ``--sync`` "
+"flag to show information from the incoming/outgoing sync tables."
+msgstr ""
+"``swift-account-info`` and ``swift-container-info`` now accept a ``--sync`` "
+"flag to show information from the incoming/outgoing sync tables."
+
+msgid ""
+"``swift-container-info`` now summarizes shard range information. Pass ``-v``/"
+"``--verbose`` if you want to see all of them."
+msgstr ""
+"``swift-container-info`` now summarizes shard range information. Pass ``-v``/"
+"``--verbose`` if you want to see all of them."
+
+msgid "``swift-dispersion-populate``"
+msgstr "``swift-dispersion-populate``"
+
+msgid "``swift-drive-recon``"
+msgstr "``swift-drive-recon``"
+
+msgid ""
+"``swift-manage-shard-ranges`` can now accept a config file; this may be used "
+"to ensure consistency of threshold values with the container-sharder config."
+msgstr ""
+"``swift-manage-shard-ranges`` can now accept a config file; this may be used "
+"to ensure consistency of threshold values with the container-sharder config."
+
+msgid "``swift-manage-shard-ranges`` improvements:"
+msgstr "``swift-manage-shard-ranges`` improvements:"
+
+msgid ""
+"``swift-recon-cron`` now includes the last time it was run in the recon "
+"information."
+msgstr ""
+"``swift-recon-cron`` now includes the last time it was run in the recon "
+"information."
+
+msgid "``swift-recon``"
+msgstr "``swift-recon``"
+
+msgid "``swift-ring-builder`` improvements"
+msgstr "``swift-ring-builder`` improvements"
+
+msgid ""
+"``swift_source`` is set for more sub-requests in the proxy-server. See `the "
+"documentation `__."
+msgstr ""
+"``swift_source`` is set for more sub-requests in the proxy-server. See `the "
+"documentation `__."
+
+msgid "and you want to take advantage of faster updates, then do this::"
+msgstr "and you want to take advantage of faster updates, then do this::"
+
+msgid ""
+"cname_lookup middleware now accepts a ``nameservers`` config variable that, "
+"if defined, will be used for DNS lookups instead of the system default."
+msgstr ""
+"cname_lookup middleware now accepts a ``nameservers`` config variable that, "
+"if defined, will be used for DNS lookups instead of the system default."
+
+msgid "domain_remap now accepts a list of domains in \"storage_domain\"."
+msgstr "domain_remap now accepts a list of domains in \"storage_domain\"."
+
+msgid "formpost can now accept a content-encoding parameter."
+msgstr "formpost can now accept a content-encoding parameter."
+
+msgid "name_check and cname_lookup keys have been added to `/info`."
+msgstr "name_check and cname_lookup keys have been added to `/info`."
+
+msgid ""
+"s3api now mimics some forms of AWS server-side encryption based on whether "
+"Swift's at-rest encryption functionality is enabled. Note that S3 API users "
+"are now able to know more about how the cluster is configured than they were "
+"previously, ie knowledge of encryption at-rest functionality being enabled "
+"or not."
+msgstr ""
+"s3api now mimics some forms of AWS server-side encryption based on whether "
+"Swift's at-rest encryption functionality is enabled. Note that S3 API users "
+"are now able to know more about how the cluster is configured than they were "
+"previously, i.e. knowledge of encryption at-rest functionality being enabled "
+"or not."
+
+msgid ""
+"s3api now mimics the AWS S3 behavior of periodically sending whitespace "
+"characters on a Complete Multipart Upload request to keep the connection "
+"from timing out. Note that since a request could fail after the initial 200 "
+"OK response has been sent, it is important to check the response body to "
+"determine if the request succeeded."
+msgstr ""
+"s3api now mimics the AWS S3 behaviour of periodically sending whitespace "
+"characters on a Complete Multipart Upload request to keep the connection "
+"from timing out. Note that since a request could fail after the initial 200 "
+"OK response has been sent, it is important to check the response body to "
+"determine if the request succeeded."
+
+msgid ""
+"s3api now properly handles ``x-amz-metadata-directive`` headers on COPY "
+"operations."
+msgstr ""
+"s3api now properly handles ``x-amz-metadata-directive`` headers on COPY "
+"operations."
+
+msgid ""
+"s3api now uses concurrency (default 2) to handle multi-delete requests. This "
+"allows multi-delete requests to be processed much more quickly."
+msgstr ""
+"s3api now uses concurrency (default 2) to handle multi-delete requests. This "
+"allows multi-delete requests to be processed much more quickly."
+
+msgid "s3api responses now include a '-' in multipart ETags."
+msgstr "s3api responses now include a '-' in multipart ETags."
+
+msgid ""
+"statsd error messages correspond to 5xx responses only. This makes "
+"monitoring more useful because actual errors (5xx) will not be hidden by "
+"common user requests (4xx). Previously, some 4xx responses would be included "
+"in timing information in the statsd error messages."
+msgstr ""
+"statsd error messages correspond to 5xx responses only. This makes "
+"monitoring more useful because actual errors (5xx) will not be hidden by "
+"common user requests (4xx). Previously, some 4xx responses would be included "
+"in timing information in the statsd error messages."
+
+msgid "swift-recon now respects storage policy aliases."
+msgstr "swift-recon now respects storage policy aliases."
+
+msgid "tempauth user names now support unicode characters."
+msgstr "tempauth user names now support Unicode characters."
diff --git a/releasenotes/source/locale/ja/LC_MESSAGES/releasenotes.po b/releasenotes/source/locale/ja/LC_MESSAGES/releasenotes.po
new file mode 100644
index 0000000000..2a0836d53e
--- /dev/null
+++ b/releasenotes/source/locale/ja/LC_MESSAGES/releasenotes.po
@@ -0,0 +1,1351 @@
+# Shu Muto , 2017. #zanata
+# Shu Muto , 2018. #zanata
+msgid ""
+msgstr ""
+"Project-Id-Version: Swift Release Notes\n"
+"Report-Msgid-Bugs-To: \n"
+"POT-Creation-Date: 2018-02-28 19:39+0000\n"
+"MIME-Version: 1.0\n"
+"Content-Type: text/plain; charset=UTF-8\n"
+"Content-Transfer-Encoding: 8bit\n"
+"PO-Revision-Date: 2018-02-08 07:28+0000\n"
+"Last-Translator: Shu Muto \n"
+"Language-Team: Japanese\n"
+"Language: ja\n"
+"X-Generator: Zanata 4.3.3\n"
+"Plural-Forms: nplurals=1; plural=0\n"
+
+msgid "2.10.0"
+msgstr "2.10.0"
+
+msgid "2.10.1"
+msgstr "2.10.1"
+
+msgid "2.10.2"
+msgstr "2.10.2"
+
+msgid "2.11.0"
+msgstr "2.11.0"
+
+msgid "2.12.0"
+msgstr "2.12.0"
+
+msgid "2.13.0"
+msgstr "2.13.0"
+
+msgid "2.13.1"
+msgstr "2.13.1"
+
+msgid "2.14.0"
+msgstr "2.14.0"
+
+msgid "2.15.0"
+msgstr "2.15.0"
+
+msgid "2.15.1"
+msgstr "2.15.1"
+
+msgid "2.16.0"
+msgstr "2.16.0"
+
+msgid "2.17.0"
+msgstr "2.17.0"
+
+msgid ""
+"A PUT or POST to a container will now update the container's Last-Modified "
+"time, and that value will be included in a GET/HEAD response."
+msgstr ""
+"コンテナーへの PUT または POST は、コンテナーの最終更新時刻を更新し、その値"
+"は GET/HEAD レスポンスに含まれます。"
+
+msgid ""
+"A composite ring comprises two or more component rings that are combined to "
+"form a single ring with a replica count equal to the sum of the component "
+"rings. The component rings are built independently, using distinct devices "
+"in distinct regions, which means that the dispersion of replicas between the "
+"components can be guaranteed."
+msgstr ""
+"複合リングは、コンポーネントリングの合計に等しい複製数を有して形成する単一リ"
+"ングが結合されたコンポーネントリングを2つ以上含みます。 コンポーネントリング"
+"は、別個の領域に別個のデバイスを使用して独立して構築されているため、コンポー"
+"ネント間のレプリカの分散を保証できます。"
+
+msgid ""
+"Accept a trade off of dispersion for balance in the ring builder that will "
+"result in getting to balanced rings much more quickly in some cases."
+msgstr ""
+"リングビルダーのバランスのために、分散のトレードオフを受け入れ、場合によって"
+"はバランスされたリングにより早く到達します。"
+
+msgid ""
+"Account and container databases will now be quarantined if the database "
+"schema has been corrupted."
+msgstr ""
+"データベーススキーマが壊れていると、アカウントとコンテナーのデータベースが隔"
+"離されるようになりました。"
+
+msgid ""
+"Account and container replication stats logs now include ``remote_merges``, "
+"the number of times a whole database was sent to another node."
+msgstr ""
+"アカウントとコンテナー複製の統計ログに、データベース全体が別のノードに送信さ"
+"れた回数、``remote_merges`` が追加されました。"
+
+msgid "Add Composite Ring Functionality"
+msgstr "複合リング機能を追加しました。"
+
+msgid "Add Vary headers for CORS responses."
+msgstr "CORS 応答用の Vary ヘッダーを追加しました。"
+
+msgid "Add checksum to object extended attributes."
+msgstr "オブジェクトの拡張属性にチェックサムを追加します。"
+
+msgid ""
+"Add support to increase object ring partition power transparently to end "
+"users and with no cluster downtime. Increasing the ring part power allows "
+"for incremental adjustment to the upper bound of the cluster size. Please "
+"review the `full docs `__ for more information."
+msgstr ""
+"エンドユーザーにオブジェクトのリング・パーティション・パワーを透過的に増加さ"
+"せるためのクラスタのダウンタイムが発生しないサポートを追加しました。リングの"
+"部分力を増加させることにより、クラスタサイズの上限に増分調整が可能になりま"
+"す。詳細は `フルドキュメント\n"
+" `__ を参照して"
+"ください。"
+
+msgid ""
+"Added ``--swift-versions`` to ``swift-recon`` CLI to compare installed "
+"versions in the cluster."
+msgstr ""
+"クラスターにインストールされているバージョンを比較するために、``swift-"
+"recon`` CLI に ``--swift-versions`` を追加しました。"
+
+msgid ""
+"Added a \"user\" option to the drive-audit config file. Its value is used to "
+"set the owner of the drive-audit recon cache."
+msgstr ""
+"ドライブ監査設定ファイルに \"user\" オプションを追加しました。その値は、ドラ"
+"イブ監査の調整キャッシュの所有者を設定するために使用されます。"
+
+msgid ""
+"Added a configurable URL base to staticweb, fixing issues when the "
+"accessible endpoint isn't known to the Swift cluster (eg http vs https)."
+msgstr ""
+"静的ウェブに対する設定可能な URL ベースを追加し、アクセス可能なエンドポイント"
+"が Swiftクラスタに知らされていない場合の問題を修正しました(例えば、httpと"
+"https)。"
+
+msgid "Added a configurable URL base to staticweb."
+msgstr "静的ウェブに対する設定可能な URL ベースを追加しました。"
+
+msgid "Added container/object listing with prefix to InternalClient."
+msgstr ""
+"InternalClient のコンテナー/オブジェクトの一覧作成で接頭辞を指定できるように"
+"なりました。"
+
+msgid "Added support for inline data segments in SLO manifests."
+msgstr "SLO マニフェストにおけるインラインデータセグメントをサポートしました。"
+
+msgid ""
+"Added support for per-policy proxy config options. This allows per-policy "
+"affinity options to be set for use with duplicated EC policies and composite "
+"rings. Certain options found in per-policy conf sections will override their "
+"equivalents that may be set in the [app:proxy-server] section. Currently the "
+"options handled that way are ``sorting_method``, ``read_affinity``, "
+"``write_affinity``, ``write_affinity_node_count``, and "
+"``write_affinity_handoff_delete_count``."
+msgstr ""
+"ポリシーごとのプロキシー設定オプションのサポートが追加されました。これによ"
+"り、ポリシーごとのアフィニティオプションを、複製された EC ポリシーおよび複合"
+"リングで使用するように設定できます。ポリシーごとの conf セクションにある特定"
+"のオプションは、 [app:proxy-server] セクションで設定できる同等のものよりも優"
+"先されます。現在、このように処理されるオプションは ``sorting_method``、 "
+"``read_affinity``、 ``write_affinity``、 ``write_affinity_node_count``、 "
+"``write_affinity_handoff_delete_count`` です。"
+
+msgid ""
+"Added support for retrieving the encryption root secret from an external key "
+"management system. In practice, this is currently limited to Barbican."
+msgstr ""
+"外部鍵管理システムからの暗号化ルートシークレットの取得をサポートしました。現"
+"在 Barbican に限定されています。"
+
+msgid "Added symlink objects support."
+msgstr "シンボリックリンクオブジェクトをサポートしました。"
+
+msgid ""
+"All 416 responses will now include a Content-Range header with an "
+"unsatisfied-range value. This allows the caller to know the valid range "
+"request value for an object."
+msgstr ""
+"416 のすべてのレスポンスには、範囲の値を持つ Content-Range ヘッダーが含まれる"
+"ようになりました。 これにより、呼び出し元はオブジェクトの有効範囲要求値を知る"
+"ことができます。"
+
+msgid "Allow the expirer to gracefully move past updating stale work items."
+msgstr "expirer が安全に古い作業項目を移動できるようになりました。"
+
+msgid "Always set Swift processes to use UTC."
+msgstr "Swift プロセスがいつも UTC を使うように設定しました。"
+
+msgid "Bug Fixes"
+msgstr "バグ修正"
+
+msgid "Cache all answers from nameservers in cname_lookup."
+msgstr "cname_lookup でネームサーバーからのすべての応答をキャッシュします。"
+
+msgid ""
+"Changed where liberasurecode-devel for CentOS 7 is referenced and installed "
+"as a dependency."
+msgstr ""
+"CentOS 7 での、liberasurecode-devel が参照、インストールされる場所を変更しま"
+"した。"
+
+msgid "Cleaned up logged tracebacks when talking to memcached servers."
+msgstr ""
+"memcached サーバーと通信するときのトレースバックログをクリーンアップしまし"
+"た。"
+
+msgid ""
+"Closed a bug where ssync may have written bad fragment data in some "
+"circumstances. A check was added to ensure the correct number of bytes is "
+"written for a fragment before finalizing the write. Also, erasure coded "
+"fragment metadata will now be validated on read requests and, if bad data is "
+"found, the fragment will be quarantined."
+msgstr ""
+"いくつかの状況で ssync が不正なフラグメントデータを書き込むバグをクローズしま"
+"した。書き込みを終了する前に、正しいバイト数がフラグメントに書き込まれている"
+"ことを確認するためのチェックが追加されました。また、消去コード化されたフラグ"
+"メントメタデータが読み取り要求で検証され、不良データが見つかると、そのフラグ"
+"メントが隔離されます。"
+
+msgid ""
+"Closed a bug where ssync may have written bad fragment data in some "
+"circumstances. A check was added to ensure the correct number of bytes is "
+"written for a fragment before finalizing the write. Also, erasure coded "
+"fragment metadata will now be validated when read and, if bad data is found, "
+"the fragment will be quarantined."
+msgstr ""
+"いくつかの状況で ssync が不正なフラグメントデータを書き込むバグをクローズしま"
+"した。書き込みを終了する前に、正しいバイト数がフラグメントに書き込まれている"
+"ことを確認するためのチェックが追加されました。また、消去コード化されたフラグ"
+"メントメタデータが読み取り要求で検証され、不良データが見つかると、そのフラグ"
+"メントが隔離されます。"
+
+msgid ""
+"Composite rings can be used for explicit replica placement and \"replicated "
+"EC\" for global erasure codes policies."
+msgstr ""
+"複合リングは、明示的なレプリカの配置と、グローバル消去コードポリシーのための"
+"「複製された EC」に使用できます。"
+
+msgid ""
+"Composite rings support 'cooperative' rebalance which means that during "
+"rebalance all component rings will be consulted before a partition is moved "
+"in any component ring. This avoids the same partition being simultaneously "
+"moved in multiple components."
+msgstr ""
+"複合リングは「協調的」リバランスをサポートしています。つまり、リバランス時"
+"に、コンポーネントリング内でパーティションを移動する前に、すべてのコンポーネ"
+"ントリングに諮られます。 これにより、複数のコンポーネントで同じパーティション"
+"を同時に移動されることがなくなります。"
+
+msgid ""
+"Container sync can now copy SLOs more efficiently by allowing the manifest "
+"to be synced before all of the referenced segments. This fixes a bug where "
+"container sync would not copy SLO manifests."
+msgstr ""
+"コンテナーシンクでは、マニフェストをすべての参照されるセグメントの前に同期さ"
+"せることで、SLO をより効率的にコピーできます。 これにより、コンテナーの同期"
+"が SLO マニフェストをコピーしないバグが修正されました。"
+
+msgid "Correctly handle deleted files with if-none-match requests."
+msgstr "if-none-match 要求で削除されたファイルを正しく処理します。"
+
+msgid ""
+"Correctly send 412 Precondition Failed if a user sends an invalid copy "
+"destination. Previously Swift would send a 500 Internal Server Error."
+msgstr ""
+"ユーザーが無効なコピー先を送信した場合は、 412 Precondition Failed を正しく送"
+"信します。以前は、Swift は 500 の内部サーバーエラーを送信しました。"
+
+msgid "Critical Issues"
+msgstr "致命的な問題"
+
+msgid "Current (Unreleased) Release Notes"
+msgstr "開発中バージョンのリリースノート"
+
+msgid ""
+"Currently the default is still only one process, and no workers. Set "
+"``reconstructor_workers`` in the ``[object-reconstructor]`` section to some "
+"whole number <= the number of devices on a node to get that many "
+"reconstructor workers."
+msgstr ""
+"現在のところ、デフォルトはまだ1つのプロセスしかなく、ワーカーはいません。多"
+"くの再構成ワーカーを得るためには、 ``[object-reconstructor]`` セクションの "
+"``reconstructor_workers`` をいくつかの合計数( <= ノード上にあるデバイスの"
+"数)を設定してください。"
+
+msgid "Daemons using InternalClient can now be properly killed with SIGTERM."
+msgstr ""
+"InternalClient を使用するデーモンは、 SIGTERM を使用して適切に停止できます。"
+
+msgid ""
+"Deleting an expiring object will now cause less work in the system. The "
+"number of async pending files written has been reduced for all objects and "
+"greatly reduced for erasure-coded objects. This dramatically reduces the "
+"burden on container servers."
+msgstr ""
+"期限切れオブジェクトの削除は、システムでの作業を削減します。非同期で保留され"
+"ているファイルの数は、すべてのオブジェクトで削減され、消去コード付きオブジェ"
+"クトでは大幅に削減されます。これにより、コンテナーサーバーの負担が劇的に軽減"
+"しました。"
+
+msgid ""
+"Deprecate swift-temp-url and call python-swiftclient's implementation "
+"instead. This adds python-swiftclient as an optional dependency of Swift."
+msgstr ""
+"swift-temp-url を非推奨にし、代わりに python-swiftclient の実装を呼び出してく"
+"ださい。これにより、python-swiftclient が Swift のオプションの依存関係として"
+"追加されます。"
+
+msgid "Deprecation Notes"
+msgstr "廃止予定の機能"
+
+msgid "Disallow X-Delete-At header values equal to the X-Timestamp header."
+msgstr ""
+"X-Delete-At ヘッダーの値が X-Timestamp ヘッダーと等しいことを禁止します。"
+
+msgid "Display more info on empty rings."
+msgstr "空のリングに詳細情報を表示します。"
+
+msgid "Do not follow CNAME when host is in storage_domain."
+msgstr "ホストが storage_domain にある場合、CNAME に従わないようにしました。"
+
+msgid "Drop support for auth-server from common/manager.py and `swift-init`."
+msgstr ""
+"common/manager.pyと `swift-init` から auth-server のサポートを削除しました。"
+
+msgid "EC Fragment Duplication - Foundational Global EC Cluster Support."
+msgstr ""
+"EC フラグメント複製 - 基盤的なグローバル EC クラスタをサポートしました。"
+
+msgid ""
+"Enable cluster-wide CORS Expose-Headers setting via \"cors_expose_headers\"."
+msgstr ""
+"\"cors_expose_headers\" でクラスタ全体の CORS Expose-Headers 設定を有効にしま"
+"す。"
+
+msgid "Enabled versioned writes on Dynamic Large Objects (DLOs)."
+msgstr ""
+"ダイナミックラージオブジェクト(DLO)でのバージョン管理された書き込みを有効に"
+"しました。"
+
+msgid ""
+"Ensure update of the container by object-updater, removing a rare "
+"possibility that objects would never be added to a container listing."
+msgstr ""
+"オブジェクトがコンテナーリスティングに追加されるない、まれな可能性を排除し、"
+"オブジェクトアップデータによるコンテナーの更新を確実にしました。"
+
+msgid ""
+"Erasure code GET performance has been significantly improved in clusters "
+"that are not completely healthy."
+msgstr ""
+"完全に健全でないクラスターにおける、消去コードの GET 性能が大幅に向上しまし"
+"た。"
+
+msgid ""
+"Erasure code reconstruction handles moving data from handoff nodes better. "
+"Instead of moving the data to another handoff, it waits until it can be "
+"moved to a primary node."
+msgstr ""
+"消失コード再構成は、ハンドオフノードからの移動データをより良く処理します。 "
+"データを別のハンドオフに移動する代わりに、プライマリーノードに移動できるよう"
+"になるまで待機します。"
+
+msgid ""
+"Erasure-coded storage policies using ``isa_l_rs_vand`` and ``nparity`` >= 5 "
+"must be configured as deprecated, preventing any new containers from being "
+"created with such a policy. This configuration is known to harm data "
+"durability. Any data in such policies should be migrated to a new policy. "
+"See See `Launchpad bug 1639691 `__ for more information."
+msgstr ""
+"``isa_l_rs_vand`` と ``nparity`` >= 5 を使った消去コード化ストレージポリシー"
+"は廃止予定にする必要があり、このようなポリシーで新しいコンテナーが作成されな"
+"いようにする必要があります。この設定は、データ耐久性に害を与えることが知られ"
+"ています。そのようなポリシー内のデータは、新しいポリシーに移行する必要があり"
+"ます。詳細は、 `Launchpad bug 1639691 `__ を参照してください。"
+
+msgid ""
+"Fixed UnicodeDecodeError in the object reconstructor that would prevent "
+"objects with non-ascii names from being reconstructed and caused the "
+"reconstructor process to hang."
+msgstr ""
+"非 ASCII 名のオブジェクトが再構築されず、再構築プロセスがハングアップする原因"
+"となるオブジェクト再構成の UnicodeDecodeError が修正されました。"
+
+msgid ""
+"Fixed XML responses (eg on bulk extractions and SLO upload failures) to be "
+"more correct. The enclosing \"delete\" tag was removed where it doesn't make "
+"sense and replaced with \"extract\" or \"upload\" depending on the context."
+msgstr ""
+"XML レスポンス(一括抽出や SLO アップロードの失敗など)がより正確になりまし"
+"た。意味のない \"delete\" の閉じタグは削除され、コンテキストに応じた "
+"\"extract\" あるいは \"upload\" に置き換えられました。"
+
+msgid "Fixed a bug in domain_remap when obj starts/ends with slash."
+msgstr ""
+"オブジェクトがスラッシュで開始/終了するときの domain_remap のバグを修正しまし"
+"た。"
+
+msgid ""
+"Fixed a bug in the EC reconstructor where an unsuccessful sync would cause "
+"extra disk I/O load on the remote server. Now the extra checking work is "
+"only requested if the sync request was successful."
+msgstr ""
+"失敗した同期がリモートサーバー上で余分なディスク I/O 負荷を引き起こす EC 再構"
+"成のバグを修正しました。同期要求が成功した場合にのみ、追加のチェック作業が要"
+"求されるようになりました。"
+
+msgid ""
+"Fixed a bug introduced in 2.15.0 where the object reconstructor would exit "
+"with a traceback if no EC policy was configured."
+msgstr ""
+"2.15.0 で導入されたバグを修正しました。 EC ポリシーが設定されていない場合は、"
+"オブジェクト再構成ツールがトレースバックで終了します。"
+
+msgid "Fixed a bug where SSYNC would fail to replicate unexpired object."
+msgstr "SSYNC が期限切れのオブジェクトを複製できないバグを修正しました。"
+
+msgid ""
+"Fixed a bug where a container listing delimiter wouldn't work with "
+"encryption."
+msgstr "コンテナーのリスト区切り文字が暗号化で機能しないバグを修正しました。"
+
+msgid ""
+"Fixed a bug where an SLO download with a range request may have resulted in "
+"a 5xx series response."
+msgstr ""
+"範囲リクエストで SLO をダウンロードした結果、 5xx シリーズの応答が発生する可"
+"能性があるバグを修正しました。"
+
+msgid ""
+"Fixed a bug where some headers weren't being copied correctly in a COPY "
+"request."
+msgstr ""
+"一部のヘッダーが COPY リクエストで正しくコピーされていなかったバグを修正しま"
+"した。"
+
+msgid "Fixed a bug where some tombstone files might never be reclaimed."
+msgstr ""
+"いくつかの廃棄済みオブジェクト (tombstone) ファイルが再利用されないかもしれな"
+"いバグを修正しました。"
+
+msgid ""
+"Fixed a bug where the ring builder would not allow removal of a device when "
+"min_part_seconds_left was greater than zero."
+msgstr ""
+"min_part_seconds_left が 0 より大きい場合、リングビルダーがデバイスの削除を許"
+"可しないバグを修正しました。"
+
+msgid "Fixed a few areas where the ``swiftdir`` option was not respected."
+msgstr ""
+"``swiftdir`` オプションが尊重されなかったいくつかの領域を修正しました。"
+
+msgid ""
+"Fixed a race condition in updating hashes.pkl where a partition suffix "
+"invalidation may have been skipped."
+msgstr ""
+"パーティションサフィックスの無効化がスキップされた可能性のある hashes.pkl の"
+"更新時の競合状態を修正しました。"
+
+msgid "Fixed a rare infinite loop in `swift-ring-builder` while placing parts."
+msgstr ""
+"パーツを置いている間の`swift-ring-builder` のまれな無限ループを修正しました。"
+
+msgid ""
+"Fixed a rare issue where multiple backend timeouts could result in bad data "
+"being returned to the client."
+msgstr ""
+"複数のバックエンドのタイムアウトが原因で、クライアントに不正なデータが返され"
+"るという稀な問題を修正しました。"
+
+msgid "Fixed a socket leak in copy middleware when a large object was copied."
+msgstr ""
+"ラージオブジェクトをコピーしたときの copy ミドルウェアのソケットリークを修正"
+"しました。"
+
+msgid ""
+"Fixed an issue where background consistency daemon child processes would "
+"deadlock waiting on the same file descriptor."
+msgstr ""
+"バックグラウンド一貫性デーモンの子プロセスが同じファイル記述子を待ってデッド"
+"ロックする問題を修正しました。"
+
+msgid "Fixed deadlock when logging from a tpool thread."
+msgstr "tpool スレッドからのロギング時のデッドロックを修正しました。"
+
+msgid ""
+"Fixed encoding issue in ssync where a mix of ascii and non-ascii metadata "
+"values would cause an error."
+msgstr ""
+"ASCII メタデータ値と非 ASCII メタデータ値が混在するとエラーが発生する、 "
+"ssync のエンコードの問題を修正しました。"
+
+msgid ""
+"Fixed error where a container drive error resulted in double space usage on "
+"rest drives. When drive with container or account database is unmounted, the "
+"bug would create handoff replicas on all remaining drives, increasing the "
+"drive space used and filling the cluster."
+msgstr ""
+"コンテナードライブのエラーにより、残りのドライブに二重のスペースが使用される"
+"というエラーを修正しました。コンテナーまたはアカウントデータベースを使用した"
+"ドライブのマウントが解除されたときに、このバグは残りのすべてのドライブにハン"
+"ドオフレプリカを作成し、ドライブの使用容量を増やし、クラスターを満たしていま"
+"した。。"
+
+msgid ""
+"Fixed non-deterministic suffix updates in hashes.pkl where a partition may "
+"be updated much less often than expected."
+msgstr ""
+"パーティションが予想よりもずっと少なく更新される可能性がある hashes.pkl の固"
+"定の非確定的なサフィックスの更新を修正しました。"
+
+msgid "Fixed rare socket leak on range requests to erasure-coded objects."
+msgstr ""
+"消去コード付きオブジェクトへの範囲リクエストでの稀なソケットリークを修正しま"
+"した。"
+
+msgid ""
+"Fixed regression in consolidate_hashes that occured when a new file was "
+"stored to new suffix to a non-empty partition. This bug was introduced in "
+"2.7.0 and could cause an increase in rsync replication stats during and "
+"after upgrade, due to inconsistent hashing of partition suffixes."
+msgstr ""
+"新しいファイルが空でないパーティションに新しいサフィックスで格納されたときに"
+"発生した consolidate_hash の退行バグを修正しました。 このバグは2.7.0で導入さ"
+"れ、パーティションサフィックスの一貫性のないハッシュのために、アップグレード"
+"中およびアップグレード後に rsync のレプリケーション統計を増加する可能性があり"
+"ます。"
+
+msgid ""
+"Fixed regression in consolidate_hashes that occurred when a new file was "
+"stored to new suffix to a non-empty partition. This bug was introduced in "
+"2.7.0 and could cause an increase in rsync replication stats during and "
+"after upgrade, due to inconsistent hashing of partition suffixes."
+msgstr ""
+"新しいファイルが空でないパーティションに新しいサフィックスで格納されたときに"
+"発生した consolidate_hash の退行バグを修正しました。 このバグは2.7.0で導入さ"
+"れ、パーティションサフィックスの一貫性のないハッシュのために、アップグレード"
+"中およびアップグレード後に rsync のレプリケーション統計を増加する可能性があり"
+"ます。"
+
+msgid "Fixed some minor test compatibility issues."
+msgstr "いくつかのテストの互換性の問題を修正しました。"
+
+msgid "Fixed the KeyError message when auditor finds an expired object."
+msgstr ""
+"監査が期限切れのオブジェクトを見つけたときの KeyError メッセージを修正しまし"
+"た。"
+
+msgid "Fixed the stats calculation in the erasure code reconstructor."
+msgstr "消去コード再構成の統計計算を修正しました。"
+
+msgid ""
+"Fixed using ``swift-ring-builder set_weight`` with more than one device."
+msgstr ""
+"複数のデバイスでの``swift-ring-builder set_weight`` の使用を修正しました。"
+
+msgid ""
+"For further information see the `docs `__"
+msgstr ""
+"詳細は `docs `__ を参照してください。"
+
+msgid "Fractional replicas are no longer allowed for erasure code policies."
+msgstr "断片的な複製は、消去コードポリシーには使用できなくなりました。"
+
+msgid ""
+"GET and HEAD requests to a symlink will operate on the referenced object and "
+"require appropriate permission in the target container. DELETE and PUT "
+"requests will operate on the symlink object itself. POST requests are not "
+"forwarded to the referenced object. POST requests sent to a symlink will "
+"result in a 307 Temporary Redirect response."
+msgstr ""
+"シンボリックリンクに対する GET と HEAD リクエストは、参照されたオブジェクトに"
+"対して操作が行われ、対象となるコンテナーへの適切な権限を必要とします。DELETE "
+"と PUT リクエストは、シンボリックリンクオブジェクト自身に操作が行われます。"
+"POST リクエストは参照されているオブジェクトに転送されません。シンボリックリン"
+"クに対する POST リクエストの送信は、307 Temporary Redirect レスポンスになりま"
+"す。"
+
+msgid "I/O priority is now supported on AArch64 architecture."
+msgstr ""
+"AArch64 アーキテクチャーで I/O 優先順位がサポートされるようになりました。"
+
+msgid ""
+"If a proxy server is configured to autocreate accounts and the account "
+"create fails, it will now return a server error (500) instead of Not Found "
+"(404)."
+msgstr ""
+"プロキシサーバーにアカウント自動作成が設定されていて、アカウント作成に失敗す"
+"ると、Not Found (404) ではなく、サーバーエラー (500) が返されます。"
+
+msgid ""
+"If using erasure coding with ISA-L in rs_vand mode and 5 or more parity "
+"fragments, Swift will emit a warning. This is a configuration that is known "
+"to harm data durability. In a future release, this warning will be upgraded "
+"to an error unless the policy is marked as deprecated. All data in an "
+"erasure code storage policy using isa_l_rs_vand with 5 or more parity should "
+"be migrated as soon as possible. Please see https://bugs.launchpad.net/swift/"
+"+bug/1639691 for more information."
+msgstr ""
+"rs_vand モードで消去コードに ISA-L を使用し、パリティフラグメントが5つ以上あ"
+"る場合、 Swift は警告を発します。これは、データの耐久性を損なうことが知られて"
+"いる設定です。将来のリリースでは、ポリシーが廃止予定とマークされていない限"
+"り、この警告はエラーにアップグレードされる予定です。 isa_l_rs_vand を 5 以上"
+"のパリティで使用する消去コード格納ポリシーのすべてのデータは、できるだけ早く"
+"移行する必要があります。詳細については、 https://bugs.launchpad.net/swift/"
+"+bug/1639691\n"
+" を参照してください。"
+
+msgid "If you upgrade and roll back, you must delete all `hashes.pkl` files."
+msgstr ""
+"アップグレードしてロールバックする場合は、すべての `hashes.pkl` ファイルを削"
+"除する必要があります。"
+
+msgid "Imported docs content from openstack-manuals project."
+msgstr ""
+"openstack-manuals プロジェクトからドキュメントコンテンツをインポートしまし"
+"た。"
+
+msgid ""
+"Improved ``object-updater`` stats logging. It now tells you all of its stats "
+"(successes, failures, quarantines due to bad pickles, unlinks, and errors), "
+"and it tells you incremental progress every five minutes. The logging at the "
+"end of a pass remains and has been expanded to also include all stats."
+msgstr ""
+"``object-updater`` 統計ログを改善しました。すべての統計(成功、失敗、悪いピク"
+"ルスによる検疫、リンク解除、エラー)を出力し、また、5分毎に進捗状況を出力し"
+"ます。成功の最後のログは残り、すべての統計情報も含むように拡張されました。"
+
+msgid ""
+"Improved performance by eliminating an unneeded directory structure hash."
+msgstr ""
+"不要なディレクトリ構造ハッシュを排除してパフォーマンスを向上させました。"
+
+msgid ""
+"Improved the granularity of the ring dispersion metric so that small "
+"improvements after a rebalance can show changes in the dispersion number. "
+"Dispersion in existing and new rings can be recalculated using the new ``--"
+"recalculate`` option to ``swift-ring-builder``."
+msgstr ""
+"再分散後の小さな改善により分散数の変化を示すことができるように、リング分散メ"
+"トリックの粒度を改善しました。既存、および新しいリングの分散は、``swift-ring-"
+"builder`` の新しい ``--recalculate`` オプションを使うことで再計算されます。"
+
+msgid "Improvements in key parts of the consistency engine"
+msgstr "整合性エンジンの重要な部分を改善しました。"
+
+msgid ""
+"In SLO manifests, the `etag` and `size_bytes` keys are now fully optional "
+"and not required. Previously, the keys needed to exist but the values were "
+"optional. The only required key is `path`."
+msgstr ""
+"SLO マニフェストでは、 `etag` と `size_bytes` キーは完全にオプションであり、"
+"必須ではありません。 以前は、キーが必要でしたが、値はオプションでした。唯一必"
+"要なキーは `path` です。"
+
+msgid ""
+"Include object sysmeta in POST responses. Sysmeta is still stripped from the "
+"response before being sent to the client, but this allows middleware to make "
+"use of the information."
+msgstr ""
+"POST 応答にオブジェクト sysmeta を含めます。 Sysmeta は依然としてクライアント"
+"に送信される前に応答から取り除かれますが、ミドルウェアはその情報を利用できま"
+"す。"
+
+msgid "Include received fragment index in reconstructor log warnings."
+msgstr "受信したフラグメントインデックスを再構築ログの警告に含めました。"
+
+msgid ""
+"Instead of using a separate .durable file to indicate the durable status of "
+"an EC fragment archive, we rename the .data to include a durable marker in "
+"the filename. This saves one inode for every EC .data file. Existing ."
+"durable files will not be removed, and they will continue to work just fine."
+msgstr ""
+"別の .durable ファイルを使用して EC フラグメントアーカイブの耐久性ステータス"
+"を示す代わりに、ファイル名に耐久マーカーを含めるように .data の名前を変更しま"
+"す。 これにより、すべてのEC .data ファイルに対して1つの inode が節約されま"
+"す。 既存の .durable ファイルは削除されず、正常に動作し続けます。"
+
+msgid ""
+"Let clients request heartbeats during SLO PUTs by including the query "
+"parameter ``heartbeat=on``."
+msgstr ""
+"SLO PUT の間、クエリーパラメーター ``heartbeat=on`` を含めることで、クライア"
+"ントがハートビートを要求できるようにしました。"
+
+msgid ""
+"Listing containers in accounts with json or xml now includes a "
+"`last_modified` time. This does not change any on-disk data, but simply "
+"exposes the value to offer consistency with the object listings on "
+"containers."
+msgstr ""
+"json または xml を使用してアカウントのコンテナーを表示するときに、 "
+"`last_modified` 時刻が追加されました。これにより、ディスク上のデータは変更さ"
+"れませんが、値を公開してコンテナーのオブジェクトリストとの一貫性を提供しま"
+"す。"
+
+msgid "Log correct status code for conditional requests."
+msgstr "条件付きリクエストの正しいステータスコードを記録します。"
+
+msgid ""
+"Log deprecation warning for ``allow_versions`` in the container server "
+"config. Configure the ``versioned_writes`` middleware in the proxy server "
+"instead. This option will be ignored in a future release."
+msgstr ""
+"コンテナーサーバーの設定の ``allow_versions`` のために、非推奨警告ログを出力"
+"します。代わりに ``versioned_writes`` ミドルウェアをプロキシサーバーに設定し"
+"ます。このオプションは将来のリリースでは無視されます。"
+
+msgid "Log the correct request type of a subrequest downstream of copy."
+msgstr "サブリクエストの正しいリクエストタイプをコピーの後ろに記録します。"
+
+msgid ""
+"Make mount_check option usable in containerized environments by adding a "
+"check for an \".ismount\" file at the root directory of a device."
+msgstr ""
+"デバイスのルートディレクトリの \".ismount\" ファイルのチェックを追加すること"
+"により、コンテナー化された環境で mount_check オプションを使用可能にします。"
+
+msgid "Mirror X-Trans-Id to X-Openstack-Request-Id."
+msgstr "X-Trans-Id を X-Openstack-Request-Id に写します。"
+
+msgid ""
+"Move listing formatting out to a new proxy middleware named "
+"``listing_formats``. ``listing_formats`` should be just right of the first "
+"proxy-logging middleware, and left of most other middlewares. If it is not "
+"already present, it will be automatically inserted for you."
+msgstr ""
+"リストの成型を ``listing_formats`` という新しいプロキシミドルウェアに移動しま"
+"した。``listing_formats`` は、最初の proxy-logging ミドルウェアの直ぐ右にあ"
+"り、他のミドルウェアの左になければなりません。まだ存在しない場合は、自動的に"
+"挿入されます。"
+
+msgid "Moved Zuul v3 tox jobs into the Swift code repo."
+msgstr "Zuul v3 の tox ジョブを Swift のリポジトリに移動しました。"
+
+msgid ""
+"Moved other-requirements.txt to bindep.txt. bindep.txt lists non-python "
+"dependencies of Swift."
+msgstr ""
+"other-requirements.txt を bindep.txt に移動しました。 bindep.txt は、 Swift "
+"の非 Python 依存関係をリストします。"
+
+msgid "New Features"
+msgstr "新機能"
+
+msgid ""
+"New config variables to change the schedule priority and I/O scheduling "
+"class. Servers and daemons now understand `nice_priority`, `ionice_class`, "
+"and `ionice_priority` to schedule their relative importance. Please read "
+"http://docs.openstack.org/developer/swift/deployment_guide.html for full "
+"config details."
+msgstr ""
+"スケジュール優先度と I/O スケジューリングクラスを変更する新しい設定変数を追加"
+"しました。サーバーとデーモンは `nice_priority`、`ionice_class`、"
+"`ionice_priority` を理解し、相対的な重要性をスケジューリングするようになりま"
+"した。 設定の詳細については、http://docs.openstack.org/developer/swift/"
+"deployment_guide.html を参照してください。"
+
+msgid "Newton Series Release Notes"
+msgstr "Newton バージョンのリリースノート"
+
+msgid ""
+"Note that after writing EC data with Swift 2.11.0 or later, that data will "
+"not be accessible to earlier versions of Swift."
+msgstr ""
+"Swift 2.11.0 以降で EC データを書き込んだ後は、以前のバージョンの Swift では"
+"そのデータにアクセスできないことに注意してください。"
+
+msgid ""
+"Note: if you have a custom middleware that makes account or container "
+"listings, it will only receive listings in JSON format."
+msgstr ""
+"注意: アカウントやコンテナー一覧を作るカスタムミドルウェアがある場合、受け取"
+"る一覧は JSON 形式のみです。"
+
+msgid ""
+"Now Swift will use ``write_affinity_handoff_delete_count`` to define how "
+"many local handoff nodes should swift send request to get more candidates "
+"for the final response. The default value \"auto\" means Swift will "
+"calculate the number automatically based on the number of replicas and "
+"current cluster topology."
+msgstr ""
+"Swiftは、 ``write_affinity_handoff_delete_count`` を使って、最終応答の候補を"
+"もっと多く得るために、どのくらいのローカルハンドオフノードが要求を送信するべ"
+"きかを定義します。デフォルト値 \"auto\" は、 Swift がレプリカの数と現在のクラ"
+"スタートポロジーに基づいて自動的に数を計算することを意味します。"
+
+msgid "Now ``swift-recon-cron`` works with conf.d configs."
+msgstr "``swift-recon-cron`` は conf.d の設定で動作するようになりました。"
+
+msgid "Object expiry improvements"
+msgstr "オブジェクトの有効期限の改善"
+
+msgid ""
+"Object versioning now supports a \"history\" mode in addition to the older "
+"\"stack\" mode. The difference is in how DELETE requests are handled. For "
+"full details, please read http://docs.openstack.org/developer/swift/"
+"overview_object_versioning.html."
+msgstr ""
+"オブジェクトのバージョン管理は、古い \"stack\" モードに加えて、 \"history\" "
+"モードをサポートするようになりました。 違いは、 DELETE 要求の処理方法にありま"
+"す。 詳細については、 http://docs.openstack.org/developer/swift/"
+"overview_object_versioning.html を参照してください。"
+
+msgid "Ocata Series Release Notes"
+msgstr "Ocata バージョンのリリースノート"
+
+msgid ""
+"On newer kernels (3.15+ when using xfs), Swift will use the O_TMPFILE flag "
+"when opening a file instead of creating a temporary file and renaming it on "
+"commit. This makes the data path simpler and allows the filesystem to more "
+"efficiently optimize the files on disk, resulting in better performance."
+msgstr ""
+"新しいカーネル(xfsを使用する場合 3.15+ )では、一時ファイルを作成してコミッ"
+"ト時に名前を変更する代わりに、ファイルを開くときに Swift が O_TMPFILE フラグ"
+"を使用します。これにより、データパスが簡単になり、ファイルシステムがディスク"
+"上のファイルをより効率的に最適化できるようになり、パフォーマンスが向上しま"
+"す。"
+
+msgid ""
+"Optimize the Erasure Code reconstructor protocol to reduce IO load on "
+"servers."
+msgstr ""
+"消去コード再構成プロトコルを最適化して、サーバーの IO 負荷を軽減します。"
+
+msgid ""
+"Optimized the common case for hashing filesystem trees, thus eliminating a "
+"lot of extraneous disk I/O."
+msgstr ""
+"ファイルシステムツリーをハッシュするための一般的なケースを最適化し、多くの余"
+"分なディスク I/O を無くしました。"
+
+msgid "Other Notes"
+msgstr "その他の注意点"
+
+msgid ""
+"PUT subrequests generated from a client-side COPY will now properly log the "
+"SSC (server-side copy) Swift source field. See https://docs.openstack.org/"
+"developer/swift/logs.html#swift-source for more information."
+msgstr ""
+"クライアント側の COPY から生成された PUT サブリクエストは、 SSC (サーバー側"
+"のコピー) Swift ソースフィールドを適切に記録するようになりました。詳細につい"
+"ては、\n"
+"https://docs.openstack.org/developer/swift/logs.html#swift-source を参照して"
+"ください。"
+
+msgid "Pike Series Release Notes"
+msgstr "Pike バージョンのリリースノート"
+
+msgid ""
+"Prevent logged traceback in object-server on client disconnect for chunked "
+"transfers to replicated policies."
+msgstr ""
+"複製されたポリシーへのチャンクされた転送時のクライアント切断で、オブジェクト"
+"サーバーにログされたトレースバックを防止します。"
+
+msgid ""
+"Previously, when deleting objects in multi-region swift deployment with "
+"write affinity configured, users always get 404 when deleting object before "
+"it's replicated to appropriate nodes."
+msgstr ""
+"以前は、書き込みアフィニティを設定したマルチリージョンの Swift 構成でオブジェ"
+"クトを削除すると、オブジェクトが適切なノードにレプリケートされる前にオブジェ"
+"クトを削除すると常に 404 となりました。"
+
+msgid ""
+"Remove ``swift-temp-url`` script. The functionality has been in swiftclient "
+"for a long time and this script has been deprecated since 2.10.0."
+msgstr ""
+"``swift-temp-url`` スクリプトを削除しました。この機能は、長い間 swiftclient "
+"にありましたが、2.10.0 から非推奨でした。"
+
+msgid "Remove deprecated ``vm_test_mode`` option."
+msgstr "非推奨の ``vm_test_mode`` オプションを削除しました。"
+
+msgid "Remove empty db hash and suffix directories if a db gets quarantined."
+msgstr ""
+"DB が隔離された場合に、空の DB ハッシュとサフィックスディレクトリを削除しま"
+"す。"
+
+msgid ""
+"Removed \"in-process-\" from func env tox name to work with upstream CI."
+msgstr ""
+"上流の CI で動作するように、func env tox 名から \"in-process-\" を削除しまし"
+"た。"
+
+msgid ""
+"Removed a race condition where a POST to an SLO could modify the X-Static-"
+"Large-Object metadata."
+msgstr ""
+"SLO クラウドへの POST が X-Static-Large-Object メタデータを変更できる、競合状"
+"態を削除しました。"
+
+msgid ""
+"Removed all ``post_as_copy`` related code and configs. The option has been "
+"deprecated since 2.13.0."
+msgstr ""
+"``post_as_copy`` に関連するすべてのコードと設定を削除しました。このオプション"
+"は、2.13.0 から非推奨でした。"
+
+msgid ""
+"Removed per-device reconstruction stats. Now that the reconstructor is "
+"shuffling parts before going through them, those stats no longer make sense."
+msgstr ""
+"デバイスごとの再構成の統計を削除しました。再構成は、それらを通過する前にパー"
+"ツをシャッフルするので、それらの統計はもはや意味をなしません。"
+
+msgid ""
+"Replaced ``replication_one_per_device`` by custom count defined by "
+"``replication_concurrency_per_device``. The original config value is "
+"deprecated, but continues to function for now. If both values are defined, "
+"the old ``replication_one_per_device`` is ignored."
+msgstr ""
+"``replication_one_per_device`` を ``replication_concurrency_per_device`` に"
+"よって定義されるカスタムカウントに置き換えました。元の設定値は非推奨となりま"
+"したが、引き続き機能します。両方の値が定義された場合、古い "
+"``replication_one_per_device`` は無視されます。"
+
+msgid "Require that known-bad EC schemes be deprecated"
+msgstr "既知の悪い EC スキームの要件を非推奨にしました。"
+
+msgid "Respect server type for --md5 check in swift-recon."
+msgstr "swift-recon での --md5 チェックのサーバー種別を尊重します。"
+
+msgid ""
+"Respond 400 Bad Request when Accept headers fail to parse instead of "
+"returning 406 Not Acceptable."
+msgstr ""
+"Accept ヘッダーの解析に失敗した時、406 Not Acceptable の代わりに 400 Bad "
+"Request が返されます。"
+
+msgid ""
+"Ring files now include byteorder information about the endian of the machine "
+"used to generate the file, and the values are appropriately byteswapped if "
+"deserialized on a machine with a different endianness. Newly created ring "
+"files will be byteorder agnostic, but previously generated ring files will "
+"still fail on different endian architectures. Regenerating older ring files "
+"will cause them to become byteorder agnostic. The regeneration of the ring "
+"files will not cause any new data movement. Newer ring files will still be "
+"usable by older versions of Swift (on machines with the same endianness--"
+"this maintains existing behavior)."
+msgstr ""
+"リングファイルには、ファイルを生成するために使用されたマシンのエンディアンに"
+"関するバイトオーダー情報が含まれるようになりました。エンディアンが異なるマシ"
+"ンでデシリアライズされた場合、値は適切にバイトスワップされます。新しく作成さ"
+"れたリングファイルはバイトオーダーには依存しませんが、以前に生成されたリング"
+"ファイルは引き続き異なるエンディアンアーキテクチャで失敗します。古いリング"
+"ファイルを再生成すると、それらはバイトオーダーに無関係になります。リングファ"
+"イルを再生成しても、新しいデータの移動は発生しません。最新のリングファイルは "
+"Swift の古いバージョンでも使用できます(同じエンディアンのマシンでは、これは"
+"既存の動作を維持します)。"
+
+msgid ""
+"Rings with min_part_hours set to zero will now only move one partition "
+"replica per rebalance, thus matching behavior when min_part_hours is greater "
+"than zero."
+msgstr ""
+"min_part_hours が 0 に設定されたリングは、リバランスのたびに1つのパーティ"
+"ションレプリカのみを移動するため、 min_part_hours が 0 より大きい場合の動作が"
+"一致します。"
+
+msgid ""
+"SLO manifest PUT requests can now be properly validated by sending an ETag "
+"header of the md5 sum of the concatenated md5 sums of the referenced "
+"segments."
+msgstr ""
+"参照されたセグメントの md5 合計が連結されたものの md5 合計を ETag ヘッダーで"
+"送信することによって、SLO マニフェストの PUT 要求を適切に検証することができま"
+"す。"
+
+msgid ""
+"SLO will now concurrently HEAD segments, resulting in much faster manifest "
+"validation and object creation. By default, two HEAD requests will be done "
+"at a time, but this can be changed by the operator via the new `concurrency` "
+"setting in the \"[filter:slo]\" section of the proxy server config."
+msgstr ""
+"SLO は現在、 HEAD セグメントを同時に処理するため、マニフェストの検証とオブ"
+"ジェクト作成が大幅に高速化されます。 デフォルトでは、一度に2つの HEAD リクエ"
+"ストが実行されますが、これはプロキシーサーバーの設定の \"[filter:slo]\" セク"
+"ションの新しい `concurrency` 設定によってオペレーターが変更できます。"
+
+msgid ""
+"Save the ring when dispersion improves, even if balance doesn't improve."
+msgstr ""
+"バランスが改善されない場合でも、分散が改善されたときにリングを保存します。"
+
+msgid "Send ETag header in 206 Partial Content responses to SLO reads."
+msgstr ""
+"SLO 読み込みへの 206 Partial Content 応答で ETag ヘッダーを送信します。"
+
+msgid ""
+"Significant improvements to the api-ref doc available at http://developer."
+"openstack.org/api-ref/object-storage/."
+msgstr ""
+"http://developer.openstack.org/api-ref/object-storage/ の api-ref ドキュメン"
+"トに対する重要な改善が行われました。"
+
+msgid ""
+"Static Large Object (SLO) manifest may now (again) have zero-byte last "
+"segments."
+msgstr ""
+"Static Large Object (SLO) マニフェストは、0 バイトの最終セグメントを再度持つ"
+"ようになりました。"
+
+msgid ""
+"Stop logging tracebacks in the ``object-replicator`` when it runs out of "
+"handoff locations."
+msgstr ""
+"``object-replicator`` を実行する場所を使い果たした時のトレースバックのログを"
+"停止しました。"
+
+msgid "Stopped logging tracebacks when receiving an unexpected response."
+msgstr "想定外の応答を受信した時のトレースバックのログを停止しました。"
+
+msgid "Support multi-range GETs for static large objects."
+msgstr "静的ラージオブジェクトの multi-range GET をサポートしました。"
+
+msgid "Suppress unexpected-file warnings for rsync temp files."
+msgstr "rsync の一時ファイルに対する unexpected-file 警告を抑制しました。"
+
+msgid "Suppressed the KeyError message when auditor finds an expired object."
+msgstr ""
+"監査が期限切れのオブジェクトを見つけたときの KeyError メッセージを抑制しまし"
+"た。"
+
+msgid "Swift Release Notes"
+msgstr "Swift リリースノート"
+
+msgid ""
+"Symlink objects reference one other object. They are created by creating an "
+"empty object with an X-Symlink-Target header. The value of the header is of "
+"the format /, and the target does not need to exist at "
+"the time of symlink creation. Cross-account symlinks can be created by "
+"including the X-Symlink-Target-Account header."
+msgstr ""
+"Symlink オブジェクトは他のオブジェクトを参照します。これらは、X-Symlink-"
+"Target ヘッダーを持つ空のオブジェクトの作成によって作られます。ヘッダーの値"
+"は / 形式であり、シンボリックリンク作成時にターゲットが存"
+"在する必要はありません。クロスアカウントのシンボリックリンクは、X-Symlink-"
+"Target-Account ヘッダーを含むことによって作成できます。"
+
+msgid ""
+"TempURLs now support a validation against a common prefix. A prefix-based "
+"signature grants access to all objects which share the same prefix. This "
+"avoids the creation of a large amount of signatures, when a whole container "
+"or pseudofolder is shared."
+msgstr ""
+"TempURL は、共通プレフィックスに対する検証をサポートするようになりました。接"
+"頭辞ベースの署名は、同じ接頭辞を共有するすべてのオブジェクトへのアクセスを許"
+"可します。これにより、コンテナーまたは擬似フォルダーの全体を共有するときに、"
+"大量の署名を作成することがなくなります。"
+
+msgid ""
+"TempURLs using the \"inline\" parameter can now also set the \"filename\" "
+"parameter. Both are used in the Content-Disposition response header."
+msgstr ""
+"「インライン」パラメータを使用する TempURL では、「ファイル名」パラメータも設"
+"定できるようになりました。どちらも Content-Disposition レスポンスヘッダーで使"
+"用されます。"
+
+msgid ""
+"Temporary URLs now support one common form of ISO 8601 timestamps in "
+"addition to Unix seconds-since-epoch timestamps. The ISO 8601 format "
+"accepted is '%Y-%m-%dT%H:%M:%SZ'. This makes TempURLs more user-friendly to "
+"produce and consume."
+msgstr ""
+"現在、 TempURL は、Unix エポック秒のタイムスタンプに加えて、 ISO 8601 タイム"
+"スタンプの一般的な形式をサポートするようになりました。受け入れられる ISO "
+"8601 形式は、 '%Y-%m-%dT%H:%M:%SZ' です。これにより、一時 URL の作成と使用が"
+"ユーザーフレンドリーになります。"
+
+msgid ""
+"The EC reconstructor process has been dramatically improved by adding "
+"support for multiple concurrent workers. Multiple processes are required to "
+"get high concurrency, and this change results in much faster rebalance times "
+"on servers with many drives."
+msgstr ""
+"EC 再構成プロセスは、複数の並列ワーカーのサポートを追加することによって劇的に"
+"改善されました。 高い並列性を得るためには複数のプロセスが必要です。この変更に"
+"より、多くのドライブを搭載したサーバーでは大幅に高速なリバランスが行われま"
+"す。"
+
+msgid ""
+"The ``domain_remap`` middleware now supports the ``mangle_client_paths`` "
+"option. Its default \"false\" value changes ``domain_remap`` parsing to stop "
+"stripping the ``path_root`` value from URL paths. If users depend on this "
+"path mangling, operators should set ``mangle_client_paths`` to \"True\" "
+"before upgrading."
+msgstr ""
+"``domain_remap`` ミドルウェアは、``mangle_client_paths`` オプションをサポート"
+"しました。デフォルト値 \"false\" では、``domain_remap`` の解析で URL のパスか"
+"ら ``path_root`` 値を取り除かなくなります。このパスの切り取りに依存している場"
+"合は、アップグレードする前に、オペレーターは ``mangle_client_paths`` を "
+"\"True\" に設定する必要があります。"
+
+msgid ""
+"The default for `object_post_as_copy` has been changed to False. The option "
+"is now deprecated and will be removed in a future release. If your cluster "
+"is still running with post-as-copy enabled, please update it to use the "
+"\"fast-post\" method. Future versions of Swift will not support post-as-"
+"copy, and future features will not be supported under post-as-copy. (\"Fast-"
+"post\" is where `object_post_as_copy` is false)."
+msgstr ""
+"`object_post_as_copy` のデフォルトは False に変更されました。このオプションは"
+"廃止され、将来のリリースで削除される予定です。あなたのクラスターが post-as-"
+"copy を有効にして実行している場合は、 \"fast-post\" 方式を使用するように更新"
+"してください。 Swift の将来のバージョンは post-as-copyをサポートしませんし、"
+"将来の機能は post-as-copyの下ではサポートされません。(「Fast-post」は "
+"`object_post_as_copy` が false のところです)。"
+
+msgid ""
+"The erasure code reconstructor `handoffs_first` option has been deprecated "
+"in favor of `handoffs_only`. `handoffs_only` is far more useful, and just "
+"like `handoffs_first` mode in the replicator, it gives the operator the "
+"option of forcing the consistency engine to focus solely on revert (handoff) "
+"jobs, thus improving the speed of rebalances.  The `handoffs_only` behavior "
+"is somewhat consistent with the replicator's `handoffs_first` option (any "
+"error on any handoff in the replicator will make it essentially handoff only "
+"forever) but the `handoff_only` option does what you want and is named "
+"correctly in the reconstructor."
+msgstr ""
+"消去コード再構成の `handoffs_first` オプションは `handoffs_only` のために廃止"
+"されました。 `handoffs_only` ははるかに便利で、レプリケーターの "
+"`handoffs_first` モードと同様に、一貫性エンジンに復帰(ハンドオフ)ジョブだけ"
+"に注力させるオプションをオペレーターに与え、リバランスのスピードを向上させま"
+"す。 `handoffs_only` の振る舞いは、レプリケーターの `handoffs_first` オプショ"
+"ンと一貫しています(レプリケーターのハンドオフ時にエラーが発生すると永久にハ"
+"ンドオフのみになります)が、`handoff_only` オプションは必要な処理を行い、再構"
+"成で正しく命名されます。"
+
+msgid ""
+"The erasure code reconstructor will now shuffle work jobs across all disks "
+"instead of going disk-by-disk. This eliminates single-disk I/O contention "
+"and allows continued scaling as concurrency is increased."
+msgstr ""
+"消去コード再構成は、ディスク単位で作業するのではなく、すべてのディスクで作業"
+"ジョブをシャッフルします。これにより、シングルディスクの I/O 競合がなくなり、"
+"並行性が高まるにつれて継続的なスケーリングが可能になります。"
+
+msgid ""
+"The improvements to EC reads made in Swift 2.10.0 have also been applied to "
+"the reconstructor. This allows fragments to be rebuilt in more "
+"circumstances, resulting in faster recovery from failures."
+msgstr ""
+"Swift 2.10.0 で作成された EC 読み取りの改善も、再構成に適用されています。これ"
+"により、より多くの状況でフラグメントを再構築することができ、障害からの迅速な"
+"回復が可能になります。"
+
+msgid ""
+"The number of container updates on object PUTs (ie to update listings) has "
+"been recomputed to be far more efficient  while maintaining durability "
+"guarantees. Specifically, object PUTs to erasure-coded policies will now "
+"normally result in far fewer container updates."
+msgstr ""
+"オブジェクトの PUT によるコンテナー更新の数(つまり、一覧の更新)は、耐久性の"
+"保証を維持しながら、遥かに効率的に再計算されます。具体的には、消去符号化ポリ"
+"シーへのオブジェクトの PUT は、通常、コンテナーの更新が大幅に少なくなります。"
+
+msgid ""
+"The object and container server config option ``slowdown`` has been "
+"deprecated in favor of the new ``objects_per_second`` and "
+"``containers_per_second`` options."
+msgstr ""
+"オブジェクトとコンテナーのサーバー設定オプション ``slowdown`` は、新しい "
+"``objects_per_second`` オプションと ``containers_per_second`` オプションのた"
+"めに廃止されました。"
+
+msgid ""
+"The object reconstructor can now rebuild an EC fragment for an expired "
+"object."
+msgstr ""
+"オブジェクト再構成は、期限切れのオブジェクトの EC フラグメントを再構築できる"
+"ようになりました。"
+
+msgid ""
+"The object server runs certain IO-intensive methods outside the main pthread "
+"for performance. Previously, if one of those methods tried to log, this can "
+"cause a crash that eventually leads to an object server with hundreds or "
+"thousands of greenthreads, all deadlocked. The fix is to use a mutex that "
+"works across different greenlets and different pthreads."
+msgstr ""
+"オブジェクトサーバーは、パフォーマンスのためにメインの pthread の外部で特定"
+"の IO 集約型メソッドを実行します。以前は、これらのメソッドの 1 つがログに記録"
+"しようとすると、クラッシュが発生し、最終的にオブジェクトサーバーはデッドロッ"
+"クされた数百または数千のグリーンスレッドを持つに至ります。この修正は、異なる "
+"greenlet と異なる pthread にまたがって動作する mutex を使用することです。"
+
+msgid ""
+"The output of devices from ``swift-ring-builder`` has been reordered by "
+"region, zone, ip, and device."
+msgstr ""
+"``swift-ring-builder`` からのデバイスの出力は、リージョン、ゾーン、IP、デバイ"
+"スによって、並べ替えられます。"
+
+msgid ""
+"The tempurl digest algorithm is now configurable, and Swift added support "
+"for both SHA-256 and SHA-512. Supported tempurl digests are exposed to "
+"clients in ``/info``. Additionally, tempurl signatures can now be base64 "
+"encoded."
+msgstr ""
+"tmpurl のダイジェストアルゴリズムが設定可能になり、Swift は、SHA-256 および "
+"SHA-512 の両方のサポートを追加しました。サポートされる tmpurl ダイジェスト"
+"は、``/info`` にてクライアントに公開されます。さらに、tempurl の署名を "
+"base64 でエンコードできるようになりました。"
+
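Since the note above says the supported digests are advertised in ``/info``, a client can discover them before signing; a sketch using the requests library from requirements.txt, where the exact key names inside the ``tempurl`` capability block are an assumption to verify against the middleware docs::

    import requests

    # Hypothetical endpoint; /info requires no auth token.
    caps = requests.get('https://swift.example.com/info').json()

    tempurl_caps = caps.get('tempurl', {})
    print(tempurl_caps.get('allowed_digests'))   # e.g. ['sha256', 'sha512']
    print(tempurl_caps.get('methods'))           # e.g. ['GET', 'HEAD', 'PUT', 'POST', 'DELETE']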
+msgid ""
+"Throttle update_auditor_status calls so it updates no more than once per "
+"minute."
+msgstr ""
+"update_auditor_status の呼び出しを絞りました。なので、1分に1回しか更新しませ"
+"ん。"
+
+msgid ""
+"Throttle update_auditor_status calls so it updates no more than once per "
+"minute. This prevents excessive IO on a new cluster."
+msgstr ""
+"update_auditor_status の呼び出しを絞りました。なので、1分に1回しか更新しませ"
+"ん。これにより、新しいクラスタで過剰な I/O が発生するのを防ぎます。"
+
+msgid ""
+"Update dnspython dependency to 1.14, removing the need to have separate "
+"dnspython dependencies for Py2 and Py3."
+msgstr ""
+"dnspython の依存関係を 1.14 に更新し、dnspython の依存関係を Python 2 と "
+"Python 3 に分ける必要性をなくしました。"
+
+msgid "Updated docs to reference appropriate ports."
+msgstr "適切なポートを参照するようにドキュメントを更新しました。"
+
+msgid "Updated the PyECLib dependency to 1.3.1."
+msgstr "PyECLib の依存関係を 1.3.1 に更新しました。"
+
+msgid ""
+"Updated the `hashes.pkl` file format to include timestamp information for "
+"race detection. Also simplified hashing logic to prevent race conditions and "
+"optimize for the common case."
+msgstr ""
+"競合検出のタイムスタンプ情報を含むように `hashes.pkl` ファイル形式を更新しま"
+"した。また競合状態を防止し、一般的なケースを最適化するために、ハッシュロジッ"
+"クを簡略化しました。"
+
+msgid ""
+"Upgrade Impact: If you upgrade and roll back, you must delete all `hashes."
+"pkl` files."
+msgstr ""
+"アップグレードの影響: アップグレードしてロールバックする場合は、すべての "
+"`hashes.pkl` ファイルを削除する必要があります。"
+
+msgid "Upgrade Notes"
+msgstr "アップグレード時の注意"
+
+msgid ""
+"Upgrade impact -- during a rolling upgrade, an updated proxy server may "
+"write a manifest that an out-of-date proxy server will not be able to read. "
+"This will resolve itself once the upgrade completes on all nodes."
+msgstr ""
+"アップグレードの影響 -- ローリングアップグレード中に、更新されたプロキシサー"
+"バーは、期限切れのプロキシサーバーが読み込むことができないマニフェストを書き"
+"出す可能性があります。これは、すべてのノードでアップグレードが完了すると自ず"
+"と解決します。"
+
+msgid "Various other minor bug fixes and improvements."
+msgstr "様々な他のマイナーなバグ修正と改善。"
+
+msgid ""
+"WARNING: If you are using the ISA-L library for erasure codes, please "
+"upgrade to liberasurecode 1.3.1 (or later) as soon as possible. If you are "
+"using isa_l_rs_vand with more than 4 parity, please read https://bugs."
+"launchpad.net/swift/+bug/1639691 and take necessary action."
+msgstr ""
+"警告: 消去コードに ISA-L ライブラリを使用している場合は、できるだけ早く "
+"liberasurecode 1.3.1 (またはそれ以降)にアップグレードしてください。 4つ以上"
+"のパリティを持つ isa_l_rs_vand を使用している場合は、 https://bugs.launchpad."
+"net/swift/+bug/1639691 を参照して必要な処置を行ってください。"
+
+msgid ""
+"We do not yet have CLI tools for creating composite rings, but the "
+"functionality has been enabled in the ring modules to support this advanced "
+"functionality. CLI tools will be delivered in a subsequent release."
+msgstr ""
+"複合リングを作成するための CLI ツールはまだありませんが、この高度な機能をサ"
+"ポートするためにリングモジュールで機能が有効になっています。 CLI ツールは、以"
+"降のリリースで提供されます。"
+
+msgid ""
+"When requesting objects, return 404 if a tombstone is found and is newer "
+"than any data found. Previous behavior was to return stale data."
+msgstr ""
+"オブジェクトを要求するとき、廃棄済みオブジェクト (tombstone) があり、他のデー"
+"タよりも新しい場合には 404 を返します。以前の動作では、古いデータが返されてい"
+"ました。"
+
+msgid ""
+"When the object auditor examines an object, it will now add any missing "
+"metadata checksums."
+msgstr ""
+"オブジェクト監査がオブジェクトを検査するとき、欠落しているメタデータのチェッ"
+"クサムを追加します。"
+
+msgid ""
+"With heartbeating turned on, the proxy will start its response immediately "
+"with 202 Accepted then send a single whitespace character periodically until "
+"the request completes. At that point, a final summary chunk will be sent "
+"which includes a \"Response Status\" key indicating success or failure and "
+"(if successful) an \"Etag\" key indicating the Etag of the resulting SLO."
+msgstr ""
+"ハートビートをオンにすると、プロキシは 直ぐに 202 Accepted で応答を開始し、リ"
+"クエストが完了するまで一つの空白文字を定期的に送信します。その時点で、成功か"
+"失敗かを示す「Response Status 」キーと、成功した場合には SLO の結果として生じ"
+"る Etag を示す「Etag」キーを含む最終サマリーチャンクが送信されるようになりま"
+"す。"
+
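A rough client-side sketch of consuming such a heartbeat response when uploading an SLO manifest, assuming a ``heartbeat=on`` query parameter on the manifest PUT, a JSON summary requested via the Accept header, and placeholder URL, token and segment values::

    import json
    import requests

    url = ('https://swift.example.com/v1/AUTH_test/container/manifest'
           '?multipart-manifest=put&heartbeat=on')
    manifest = json.dumps([{'path': '/container/seg1', 'size_bytes': 1048576}])

    resp = requests.put(url, data=manifest,
                        headers={'X-Auth-Token': 'AUTH_tk_example',
                                 'Accept': 'application/json'})

    # The proxy answers 202 Accepted immediately; the body is whitespace
    # keep-alives followed by the final JSON summary chunk.
    summary = json.loads(resp.text.lstrip())
    print(summary.get('Response Status'))   # e.g. '201 Created'
    print(summary.get('Etag'))              # Etag of the resulting SLO, on success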
+msgid "Write-affinity aware object deletion"
+msgstr "書き込みアフィニティは、オブジェクトの削除を認識します。"
+
+msgid ""
+"X-Delete-At computation now uses X-Timestamp instead of system time. This "
+"prevents clock skew causing inconsistent expiry data."
+msgstr ""
+"X-Delete-At の計算に、システム時間の代わりに X-Timestamp を使うようになりまし"
+"た。これは、時刻の誤差によって起こる期限データの矛盾を防止します。"
+
+msgid "``swift-ring-builder`` improvements"
+msgstr "``swift-ring-builder`` の改善"
+
+msgid ""
+"cname_lookup middleware now accepts a ``nameservers`` config variable that, "
+"if defined, will be used for DNS lookups instead of the system default."
+msgstr ""
+"cname_lookup ミドルウェアは、定義されていれば、システムのデフォルトではなく "
+"DNS ルックアップに使用される ``nameservers`` 設定変数を受け入れるようになりま"
+"した。"
+
+msgid "domain_remap now accepts a list of domains in \"storage_domain\"."
+msgstr ""
+"domain_remap は \"storage_domain\" にあるドメインのリストを受け入れるようにな"
+"りました。"
+
+msgid "name_check and cname_lookup keys have been added to `/info`."
+msgstr "name_check と cname_lookup キーが `/info` に追加されました。"
+
+msgid "swift-recon now respects storage policy aliases."
+msgstr "swift-recon はストレージポリシーの別名を尊重するようになりました。"
diff --git a/releasenotes/source/newton.rst b/releasenotes/source/newton.rst
new file mode 100644
index 0000000000..59418a33dd
--- /dev/null
+++ b/releasenotes/source/newton.rst
@@ -0,0 +1,6 @@
+=============================
+ Newton Series Release Notes
+=============================
+
+.. release-notes::
+   :branch: stable/newton
diff --git a/releasenotes/source/ocata.rst b/releasenotes/source/ocata.rst
new file mode 100644
index 0000000000..53fb86e386
--- /dev/null
+++ b/releasenotes/source/ocata.rst
@@ -0,0 +1,6 @@
+===================================
+ Ocata Series Release Notes
+===================================
+
+.. release-notes::
+   :branch: stable/ocata
diff --git a/releasenotes/source/pike.rst b/releasenotes/source/pike.rst
new file mode 100644
index 0000000000..e43bfc0ce1
--- /dev/null
+++ b/releasenotes/source/pike.rst
@@ -0,0 +1,6 @@
+===================================
+ Pike Series Release Notes
+===================================
+
+.. release-notes::
+   :branch: stable/pike
diff --git a/releasenotes/source/queens.rst b/releasenotes/source/queens.rst
new file mode 100644
index 0000000000..36ac6160ca
--- /dev/null
+++ b/releasenotes/source/queens.rst
@@ -0,0 +1,6 @@
+===================================
+ Queens Series Release Notes
+===================================
+
+.. release-notes::
+   :branch: stable/queens
diff --git a/releasenotes/source/rocky.rst b/releasenotes/source/rocky.rst
new file mode 100644
index 0000000000..40dd517b75
--- /dev/null
+++ b/releasenotes/source/rocky.rst
@@ -0,0 +1,6 @@
+===================================
+ Rocky Series Release Notes
+===================================
+
+.. release-notes::
+   :branch: stable/rocky
diff --git a/releasenotes/source/stein.rst b/releasenotes/source/stein.rst
new file mode 100644
index 0000000000..efaceb667b
--- /dev/null
+++ b/releasenotes/source/stein.rst
@@ -0,0 +1,6 @@
+===================================
+ Stein Series Release Notes
+===================================
+
+.. release-notes::
+   :branch: stable/stein
diff --git a/releasenotes/source/train.rst b/releasenotes/source/train.rst
new file mode 100644
index 0000000000..583900393c
--- /dev/null
+++ b/releasenotes/source/train.rst
@@ -0,0 +1,6 @@
+==========================
+Train Series Release Notes
+==========================
+
+.. release-notes::
+   :branch: stable/train
diff --git a/releasenotes/source/ussuri.rst b/releasenotes/source/ussuri.rst
new file mode 100644
index 0000000000..e21e50e0c6
--- /dev/null
+++ b/releasenotes/source/ussuri.rst
@@ -0,0 +1,6 @@
+===========================
+Ussuri Series Release Notes
+===========================
+
+.. release-notes::
+   :branch: stable/ussuri
diff --git a/releasenotes/source/victoria.rst b/releasenotes/source/victoria.rst
new file mode 100644
index 0000000000..8ce9334198
--- /dev/null
+++ b/releasenotes/source/victoria.rst
@@ -0,0 +1,6 @@
+=============================
+Victoria Series Release Notes
+=============================
+
+.. release-notes::
+   :branch: unmaintained/victoria
diff --git a/releasenotes/source/wallaby.rst b/releasenotes/source/wallaby.rst
new file mode 100644
index 0000000000..bcf35c5f80
--- /dev/null
+++ b/releasenotes/source/wallaby.rst
@@ -0,0 +1,6 @@
+============================
+Wallaby Series Release Notes
+============================
+
+.. release-notes::
+   :branch: unmaintained/wallaby
diff --git a/releasenotes/source/xena.rst b/releasenotes/source/xena.rst
new file mode 100644
index 0000000000..d19eda4886
--- /dev/null
+++ b/releasenotes/source/xena.rst
@@ -0,0 +1,6 @@
+=========================
+Xena Series Release Notes
+=========================
+
+.. release-notes::
+   :branch: unmaintained/xena
diff --git a/releasenotes/source/yoga.rst b/releasenotes/source/yoga.rst
new file mode 100644
index 0000000000..43cafdea89
--- /dev/null
+++ b/releasenotes/source/yoga.rst
@@ -0,0 +1,6 @@
+=========================
+Yoga Series Release Notes
+=========================
+
+.. release-notes::
+   :branch: unmaintained/yoga
diff --git a/releasenotes/source/zed.rst b/releasenotes/source/zed.rst
new file mode 100644
index 0000000000..6cc2b1554c
--- /dev/null
+++ b/releasenotes/source/zed.rst
@@ -0,0 +1,6 @@
+========================
+Zed Series Release Notes
+========================
+
+.. release-notes::
+   :branch: unmaintained/zed
diff --git a/requirements.txt b/requirements.txt
new file mode 100644
index 0000000000..4ae431c958
--- /dev/null
+++ b/requirements.txt
@@ -0,0 +1,13 @@
+# The order of packages is significant, because pip processes them in the order
+# of appearance. Changing the order has an impact on the overall integration
+# process, which may cause wedges in the gate later.
+
+eventlet>=0.25.0,!=0.34.3               # MIT
+greenlet>=0.4.14
+PasteDeploy>=2.0.0
+lxml>=4.2.3
+requests>=2.14.2                        # Apache-2.0
+xattr>=0.7.2;sys_platform!='win32'      # MIT
+PyECLib>=1.3.1,!=1.6.2,!=1.6.3          # BSD
+cryptography>=2.0.2                     # BSD/Apache-2.0
+dnspython>=1.15.0                       # http://www.dnspython.org/LICENSE
diff --git a/roles/additional-keystone-users/tasks/main.yaml b/roles/additional-keystone-users/tasks/main.yaml
new file mode 100644
index 0000000000..e2b9879853
--- /dev/null
+++ b/roles/additional-keystone-users/tasks/main.yaml
@@ -0,0 +1,169 @@
+- name: Set S3 endpoint
+  ini_file:
+    path: /etc/swift/test.conf
+    section: func_test
+    option: s3_storage_url
+    value: http://localhost:8080
+  become: true
+
+- name: Create primary S3 user
+  shell: >
+    openstack --os-auth-url http://localhost/identity
+    --os-project-domain-id default --os-project-name admin
+    --os-user-domain-id default --os-username admin
+    --os-password secretadmin
+    credential create --type ec2 --project swiftprojecttest1 swiftusertest1
+    '{"access": "s3-user1", "secret": "s3-secret1"}'
+- name: Add primary S3 user to test.conf
+  ini_file:
+    path: /etc/swift/test.conf
+    section: func_test
+    option: s3_access_key
+    value: s3-user1
+  become: true
+- name: Add primary S3 user secret to test.conf
+  ini_file:
+    path: /etc/swift/test.conf
+    section: func_test
+    option: s3_secret_key
+    value: s3-secret1
+  become: true
+- name: Add primary S3 user to test.conf for cross-compat tests
+  ini_file:
+    path: /etc/swift/test.conf
+    section: s3api_test
+    option: access_key1
+    value: s3-user1
+  become: true
+- name: Add primary S3 user secret to test.conf for cross-compat tests
+  ini_file:
+    path: /etc/swift/test.conf
+    section: s3api_test
+    option: secret_key1
+    value: s3-secret1
+  become: true
+
+- name: Clear secondary S3 user from test.conf
+  ini_file:
+    path: /etc/swift/test.conf
+    section: func_test
+    option: s3_access_key2
+    value: ""
+  become: true
+- name: Clear secondary S3 user from test.conf for cross-compat tests
+  ini_file:
+    path: /etc/swift/test.conf
+    section: s3api_test
+    option: access_key2
+    value: ""
+  become: true
+
+- name: Create restricted S3 user
+  shell: >
+    openstack --os-auth-url http://localhost/identity
+    --os-project-domain-id default --os-project-name admin
+    --os-user-domain-id default --os-username admin
+    --os-password secretadmin
+    credential create --type ec2 --project swiftprojecttest1 swiftusertest3
+    '{"access": "s3-user3", "secret": "s3-secret3"}'
+- name: Add restricted S3 user to test.conf
+  ini_file:
+    path: /etc/swift/test.conf
+    section: func_test
+    option: s3_access_key3
+    value: s3-user3
+  become: true
+- name: Add restricted S3 user secret to test.conf
+  ini_file:
+    path: /etc/swift/test.conf
+    section: func_test
+    option: s3_secret_key3
+    value: s3-secret3
+  become: true
+- name: Add restricted S3 user to test.conf for cross-compat tests
+  ini_file:
+    path: /etc/swift/test.conf
+    section: s3api_test
+    option: access_key3
+    value: s3-user3
+  become: true
+- name: Add restricted S3 user secret to test.conf for cross-compat tests
+  ini_file:
+    path: /etc/swift/test.conf
+    section: s3api_test
+    option: secret_key3
+    value: s3-secret3
+  become: true
+
+- name: Create service role
+  shell: >
+    openstack --os-auth-url http://localhost/identity
+    --os-project-domain-id default --os-project-name admin
+    --os-user-domain-id default --os-username admin
+    --os-password secretadmin
+    role create swift_service
+- name: Create service project
+  shell: >
+    openstack --os-auth-url http://localhost/identity
+    --os-project-domain-id default --os-project-name admin
+    --os-user-domain-id default --os-username admin
+    --os-password secretadmin
+    project create --domain default swiftprojecttest5
+- name: Create service user
+  shell: >
+    openstack --os-auth-url http://localhost/identity
+    --os-project-domain-id default --os-project-name admin
+    --os-user-domain-id default --os-username admin
+    --os-password secretadmin
+    user create --domain default --project swiftprojecttest5 swiftusertest5 --password testing5
+- name: Assign service role
+  shell: >
+    openstack --os-auth-url http://localhost/identity
+    --os-project-domain-id default --os-project-name admin
+    --os-user-domain-id default --os-username admin
+    --os-password secretadmin
+    role add --project swiftprojecttest5 --user swiftusertest5 swift_service
+
+- name: Add service_roles to proxy-server.conf
+  ini_file:
+    path: /etc/swift/proxy-server.conf
+    section: filter:keystoneauth
+    option: SERVICE_KEY_service_roles
+    value: swift_service
+  become: true
+- name: Update reseller prefixes in proxy-server.conf
+  ini_file:
+    path: /etc/swift/proxy-server.conf
+    section: filter:keystoneauth
+    option: reseller_prefix
+    value: AUTH, SERVICE_KEY
+  become: true
+
+- name: Add service account to test.conf
+  ini_file:
+    path: /etc/swift/test.conf
+    section: func_test
+    option: account5
+    value: swiftprojecttest5
+  become: true
+- name: Add service user to test.conf
+  ini_file:
+    path: /etc/swift/test.conf
+    section: func_test
+    option: username5
+    value: swiftusertest5
+  become: true
+- name: Add service password to test.conf
+  ini_file:
+    path: /etc/swift/test.conf
+    section: func_test
+    option: password5
+    value: testing5
+  become: true
+- name: Add service prefix to test.conf
+  ini_file:
+    path: /etc/swift/test.conf
+    section: func_test
+    option: service_prefix
+    value: SERVICE_KEY
+  become: true
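For reference, a small sketch of reading back the values these tasks write into /etc/swift/test.conf; the functional test suite has its own config loader, so plain configparser is used here only to show the resulting layout::

    import configparser

    conf = configparser.ConfigParser()
    conf.read('/etc/swift/test.conf')

    # Options written by the tasks above.
    print(conf.get('func_test', 's3_access_key'))    # 's3-user1'
    print(conf.get('func_test', 's3_access_key3'))   # 's3-user3' (restricted user)
    print(conf.get('func_test', 'service_prefix'))   # 'SERVICE_KEY'
    print(conf.get('s3api_test', 'access_key1'))     # 's3-user1' (cross-compat tests)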
diff --git a/roles/additional-tempauth-users/tasks/main.yaml b/roles/additional-tempauth-users/tasks/main.yaml
new file mode 100644
index 0000000000..204a56011f
--- /dev/null
+++ b/roles/additional-tempauth-users/tasks/main.yaml
@@ -0,0 +1,47 @@
+- name: Configure service auth prefix for tempauth tests
+  ini_file:
+    path: /etc/swift/proxy-server.conf
+    section: filter:tempauth
+    option: reseller_prefix
+    value: TEMPAUTH, SERVICE_TA
+  become: true
+
+- name: Configure service group for tempauth tests
+  ini_file:
+    path: /etc/swift/proxy-server.conf
+    section: filter:tempauth
+    option: SERVICE_TA_require_group
+    value: service
+  become: true
+
+- name: Configure service account for tempauth tests
+  ini_file:
+    path: "{{ ansible_env.HOME }}/{{ zuul.project.src_dir }}/../swift/test/sample.conf"
+    section: func_test
+    option: account5
+    value: test5
+  become: true
+
+- name: Configure service username for tempauth tests
+  ini_file:
+    path: "{{ ansible_env.HOME }}/{{ zuul.project.src_dir }}/../swift/test/sample.conf"
+    section: func_test
+    option: username5
+    value: tester5
+  become: true
+
+- name: Configure service user password for tempauth tests
+  ini_file:
+    path: "{{ ansible_env.HOME }}/{{ zuul.project.src_dir }}/../swift/test/sample.conf"
+    section: func_test
+    option: password5
+    value: testing5
+  become: true
+
+- name: Configure service prefix for tempauth tests
+  ini_file:
+    path: "{{ ansible_env.HOME }}/{{ zuul.project.src_dir }}/../swift/test/sample.conf"
+    section: func_test
+    option: service_prefix
+    value: SERVICE_TA
+  become: true
diff --git a/roles/dsvm-additional-middlewares/tasks/main.yaml b/roles/dsvm-additional-middlewares/tasks/main.yaml
new file mode 100644
index 0000000000..ed30b12435
--- /dev/null
+++ b/roles/dsvm-additional-middlewares/tasks/main.yaml
@@ -0,0 +1,150 @@
+- name: Add domain_remap and etag-quoter to pipeline
+  replace:
+    path: "/etc/swift/proxy-server.conf"
+    regexp: "cache listing_formats"
+    replace: "cache domain_remap etag-quoter listing_formats"
+  become: true
+
+- name: Set domain_remap domain
+  ini_file:
+    path: /etc/swift/proxy-server.conf
+    section: filter:domain_remap
+    option: storage_domain
+    value: example.com
+  become: true
+
+- name: Set storage_domain in test.conf (for Keystone tests)
+  ini_file:
+    path: /etc/swift/test.conf
+    section: func_test
+    option: storage_domain
+    value: example.com
+  become: true
+
+- name: Turn off s3_acl_tests_enabled in test.conf (for Keystone tests)
+  ini_file:
+    path: /etc/swift/test.conf
+    section: s3api_test
+    option: s3_acl_tests_enabled
+    value: false
+  become: true
+
+- name: Set storage_domain in test/sample.conf (for tempauth tests)
+  ini_file:
+    path: "{{ ansible_env.HOME }}/{{ zuul.project.src_dir }}/../swift/test/sample.conf"
+    section: func_test
+    option: storage_domain
+    value: example.com
+  become: true
+
+- name: Turn off s3_acl_tests_enabled in test/sample.conf (for tempauth tests)
+  ini_file:
+    path: "{{ ansible_env.HOME }}/{{ zuul.project.src_dir }}/../swift/test/sample.conf"
+    section: s3api_test
+    option: s3_acl_tests_enabled
+    value: false
+  become: true
+
+- name: Enable object versioning
+  ini_file:
+    path: /etc/swift/proxy-server.conf
+    section: filter:versioned_writes
+    option: allow_object_versioning
+    value: true
+  become: true
+
+- name: Configure s3api force_swift_request_proxy_log
+  ini_file:
+    path: /etc/swift/proxy-server.conf
+    section: filter:s3api
+    option: force_swift_request_proxy_log
+    value: true
+  become: true
+
+- name: "Configure s3token: auth_url"
+  ini_file:
+    path: /etc/swift/proxy-server.conf
+    section: filter:s3token
+    option: auth_url
+    value: http://localhost/identity
+  become: true
+
+- name: "Configure s3token: project_domain_name"
+  ini_file:
+    path: /etc/swift/proxy-server.conf
+    section: filter:s3token
+    option: project_domain_name
+    value: Default
+  become: true
+
+- name: "Configure s3token: project_name"
+  ini_file:
+    path: /etc/swift/proxy-server.conf
+    section: filter:s3token
+    option: project_name
+    value: service
+  become: true
+
+- name: "Configure s3token: user_domain_name"
+  ini_file:
+    path: /etc/swift/proxy-server.conf
+    section: filter:s3token
+    option: user_domain_name
+    value: Default
+  become: true
+
+- name: "Configure s3token: username"
+  ini_file:
+    path: /etc/swift/proxy-server.conf
+    section: filter:s3token
+    option: username
+    value: swift
+  become: true
+
+- name: "Configure s3token: password"
+  ini_file:
+    path: /etc/swift/proxy-server.conf
+    section: filter:s3token
+    option: password
+    value: secretservice
+  become: true
+
+- name: "Configure s3token: auth_type"
+  ini_file:
+    path: /etc/swift/proxy-server.conf
+    section: filter:s3token
+    option: auth_type
+    value: password
+  become: true
+
+- name: "Configure s3token: interface"
+  ini_file:
+    path: /etc/swift/proxy-server.conf
+    section: filter:s3token
+    option: interface
+    value: public
+  become: true
+
+- name: Copy ring for Policy-1
+  copy:
+    remote_src: true
+    src: /etc/swift/object.ring.gz
+    dest: /etc/swift/object-1.ring.gz
+  become: true
+
+- name: Add Policy-1 to swift.conf
+  ini_file:
+    path: /etc/swift/swift.conf
+    section: storage-policy:1
+    option: name
+    value: Policy-1
+  become: true
+
+- name: Restart service to pick up config changes
+  command: systemctl restart devstack@s-{{ item }}.service
+  become: true
+  with_items:
+    - proxy
+    - account
+    - container
+    - object
diff --git a/setup.cfg b/setup.cfg
index 409348eb71..830268bb3f 100644
--- a/setup.cfg
+++ b/setup.cfg
@@ -1,31 +1,148 @@
-[build_sphinx]
-all_files = 1
-build-dir = doc/build
-source-dir = doc/source
-
-[egg_info]
-tag_build = 
-tag_date = 0
-tag_svn_revision = 0
-
-[compile_catalog]
-directory = locale
-domain = swift
-
-[update_catalog]
-domain = swift
-output_dir = locale
-input_file = locale/swift.pot
-
-[extract_messages]
-keywords = _ l_ lazy_gettext
-mapping_file = babel.cfg
-output_file = locale/swift.pot
-
-[nosetests]
-exe=1
-verbosity=2
-detailed-errors=1
-cover-package = swift
-cover-html = true
-cover-erase = true
+[metadata]
+name = swift
+summary = OpenStack Object Storage
+description_file =
+    README.rst
+long_description_content_type = text/x-rst
+author = OpenStack
+author_email = openstack-discuss@lists.openstack.org
+url = https://docs.openstack.org/swift/latest/
+python_requires = >=3.7
+project_urls =
+    Documentation = https://docs.openstack.org/swift/latest/
+    Bug Tracker = https://bugs.launchpad.net/swift
+    Source Code = https://opendev.org/openstack/swift/
+    Release Notes = https://opendev.org/openstack/swift/src/branch/master/CHANGELOG
+classifier =
+    Development Status :: 5 - Production/Stable
+    Environment :: OpenStack
+    Intended Audience :: Information Technology
+    Intended Audience :: System Administrators
+    License :: OSI Approved :: Apache Software License
+    Operating System :: POSIX :: Linux
+    Programming Language :: Python
+    Programming Language :: Python :: 3
+    Programming Language :: Python :: 3.7
+    Programming Language :: Python :: 3.8
+    Programming Language :: Python :: 3.9
+    Programming Language :: Python :: 3.10
+    Programming Language :: Python :: 3.11
+    Programming Language :: Python :: 3.12
+
+[pbr]
+skip_authors = True
+skip_changelog = True
+skip_reno = True
+
+[options]
+packages =
+    swift
+
+[extras]
+kms_keymaster =
+    oslo.config>=5.2.0 # Apache-2.0
+    castellan>=0.13.0 # Apache-2.0
+
+kmip_keymaster =
+    pykmip>=0.7.0 # Apache-2.0
+
+keystone =
+    keystonemiddleware>=4.17.0
+
+[entry_points]
+console_scripts =
+    swift-account-audit = swift.cli.account_audit:main
+    swift-account-auditor = swift.account.auditor:main
+    swift-account-info = swift.cli.info:account_main
+    swift-account-reaper = swift.account.reaper:main
+    swift-account-replicator = swift.account.replicator:main
+    swift-account-server = swift.account.server:main
+    swift-config = swift.cli.config:main
+    swift-container-auditor = swift.container.auditor:main
+    swift-container-deleter = swift.cli.container_deleter:main
+    swift-container-info = swift.cli.info:container_main
+    swift-container-replicator = swift.container.replicator:main
+    swift-container-reconciler = swift.container.reconciler:main
+    swift-container-server = swift.container.server:main
+    swift-container-sharder = swift.container.sharder:main
+    swift-container-sync = swift.container.sync:main
+    swift-container-updater = swift.container.updater:main
+    swift-dispersion-populate = swift.cli.dispersion_populate:main
+    swift-dispersion-report = swift.cli.dispersion_report:main
+    swift-drive-audit = swift.cli.drive_audit:main
+    swift-form-signature = swift.cli.form_signature:main
+    swift-get-nodes = swift.cli.get_nodes:main
+    swift-init = swift.common.manager:main
+    swift-manage-shard-ranges = swift.cli.manage_shard_ranges:main
+    swift-object-auditor = swift.obj.auditor:main
+    swift-object-expirer = swift.obj.expirer:main
+    swift-object-info = swift.cli.info:obj_main
+    swift-object-reconstructor = swift.obj.reconstructor:main
+    swift-object-relinker = swift.cli.relinker:main
+    swift-object-replicator = swift.obj.replicator:main
+    swift-object-server = swift.obj.server:main
+    swift-object-updater = swift.obj.updater:main
+    swift-oldies = swift.cli.oldies:main
+    swift-orphans = swift.cli.orphans:main
+    swift-proxy-server = swift.proxy.server:main
+    swift-recon = swift.cli.recon:main
+    swift-recon-cron = swift.cli.recon_cron:main
+    swift-reconciler-enqueue = swift.cli.reconciler_enqueue:main
+    swift-reload = swift.cli.reload:main
+    swift-ring-builder = swift.cli.ringbuilder:error_handling_main
+    swift-ring-builder-analyzer = swift.cli.ring_builder_analyzer:main
+    swift-ring-composer = swift.cli.ringcomposer:main
+
+paste.app_factory =
+    proxy = swift.proxy.server:app_factory
+    object = swift.obj.server:app_factory
+    mem_object = swift.obj.mem_server:app_factory
+    container = swift.container.server:app_factory
+    account = swift.account.server:app_factory
+
+paste.filter_factory =
+    healthcheck = swift.common.middleware.healthcheck:filter_factory
+    crossdomain = swift.common.middleware.crossdomain:filter_factory
+    memcache = swift.common.middleware.memcache:filter_factory
+    read_only = swift.common.middleware.read_only:filter_factory
+    ratelimit = swift.common.middleware.ratelimit:filter_factory
+    backend_ratelimit = swift.common.middleware.backend_ratelimit:filter_factory
+    cname_lookup = swift.common.middleware.cname_lookup:filter_factory
+    catch_errors = swift.common.middleware.catch_errors:filter_factory
+    domain_remap = swift.common.middleware.domain_remap:filter_factory
+    staticweb = swift.common.middleware.staticweb:filter_factory
+    tempauth = swift.common.middleware.tempauth:filter_factory
+    keystoneauth = swift.common.middleware.keystoneauth:filter_factory
+    recon = swift.common.middleware.recon:filter_factory
+    tempurl = swift.common.middleware.tempurl:filter_factory
+    formpost = swift.common.middleware.formpost:filter_factory
+    name_check = swift.common.middleware.name_check:filter_factory
+    bulk = swift.common.middleware.bulk:filter_factory
+    container_quotas = swift.common.middleware.container_quotas:filter_factory
+    account_quotas = swift.common.middleware.account_quotas:filter_factory
+    proxy_logging = swift.common.middleware.proxy_logging:filter_factory
+    dlo = swift.common.middleware.dlo:filter_factory
+    slo = swift.common.middleware.slo:filter_factory
+    list_endpoints = swift.common.middleware.list_endpoints:filter_factory
+    gatekeeper = swift.common.middleware.gatekeeper:filter_factory
+    container_sync = swift.common.middleware.container_sync:filter_factory
+    xprofile = swift.common.middleware.xprofile:filter_factory
+    versioned_writes = swift.common.middleware.versioned_writes:filter_factory
+    copy = swift.common.middleware.copy:filter_factory
+    keymaster = swift.common.middleware.crypto.keymaster:filter_factory
+    encryption = swift.common.middleware.crypto:filter_factory
+    kms_keymaster = swift.common.middleware.crypto.kms_keymaster:filter_factory
+    kmip_keymaster = swift.common.middleware.crypto.kmip_keymaster:filter_factory
+    listing_formats = swift.common.middleware.listing_formats:filter_factory
+    symlink = swift.common.middleware.symlink:filter_factory
+    s3api = swift.common.middleware.s3api.s3api:filter_factory
+    s3token = swift.common.middleware.s3api.s3token:filter_factory
+    etag_quoter = swift.common.middleware.etag_quoter:filter_factory
+
+swift.diskfile =
+    replication.fs = swift.obj.diskfile:DiskFileManager
+    erasure_coding.fs = swift.obj.diskfile:ECDiskFileManager
+
+swift.object_audit_watcher =
+    dark_data = swift.obj.watchers.dark_data:DarkDataWatcher
+
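The console_scripts and paste factories registered above are ordinary Python entry points, so they can also be resolved programmatically; a brief sketch using importlib.metadata (the ``group=`` keyword needs Python 3.10+, older interpreters expose a dict-style API instead)::

    from importlib.metadata import entry_points

    # Resolve the proxy app factory that setup.cfg registers for PasteDeploy.
    proxy_ep = next(ep for ep in entry_points(group='paste.app_factory')
                    if ep.name == 'proxy')
    app_factory = proxy_ep.load()          # swift.proxy.server:app_factory

    # Filter factories resolve the same way, e.g. the healthcheck middleware.
    hc_ep = next(ep for ep in entry_points(group='paste.filter_factory')
                 if ep.name == 'healthcheck')
    healthcheck_factory = hc_ep.load()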
diff --git a/setup.py b/setup.py
index 8c3dfee83f..22cfdce874 100644
--- a/setup.py
+++ b/setup.py
@@ -1,5 +1,5 @@
-#!/usr/bin/python
-# Copyright (c) 2010-2012 OpenStack, LLC.
+#!/usr/bin/env python3
+# Copyright (c) 2013 Hewlett-Packard Development Company, L.P.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
@@ -14,89 +14,8 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 
-from setuptools import setup, find_packages
+import setuptools
 
-from swift import __canonical_version__ as version
-
-
-name = 'swift'
-
-
-setup(
-    name=name,
-    version=version,
-    description='Swift',
-    license='Apache License (2.0)',
-    author='OpenStack, LLC.',
-    author_email='openstack-admins@lists.launchpad.net',
-    url='https://launchpad.net/swift',
-    packages=find_packages(exclude=['test', 'bin']),
-    test_suite='nose.collector',
-    classifiers=[
-        'Development Status :: 4 - Beta',
-        'License :: OSI Approved :: Apache Software License',
-        'Operating System :: POSIX :: Linux',
-        'Programming Language :: Python :: 2.6',
-        'Environment :: No Input/Output (Daemon)',
-        'Environment :: OpenStack',
-    ],
-    install_requires=[],  # removed for better compat
-    scripts=[
-        'bin/swift-account-audit',
-        'bin/swift-account-auditor',
-        'bin/swift-account-reaper',
-        'bin/swift-account-replicator',
-        'bin/swift-account-server',
-        'bin/swift-bench',
-        'bin/swift-bench-client',
-        'bin/swift-container-auditor',
-        'bin/swift-container-replicator',
-        'bin/swift-container-server',
-        'bin/swift-container-sync',
-        'bin/swift-container-updater',
-        'bin/swift-dispersion-populate',
-        'bin/swift-dispersion-report',
-        'bin/swift-drive-audit',
-        'bin/swift-form-signature',
-        'bin/swift-get-nodes',
-        'bin/swift-init',
-        'bin/swift-object-auditor',
-        'bin/swift-object-expirer',
-        'bin/swift-object-info',
-        'bin/swift-object-replicator',
-        'bin/swift-object-server',
-        'bin/swift-object-updater',
-        'bin/swift-oldies',
-        'bin/swift-orphans',
-        'bin/swift-proxy-server',
-        'bin/swift-recon',
-        'bin/swift-recon-cron',
-        'bin/swift-ring-builder',
-        'bin/swift-temp-url',
-    ],
-    entry_points={
-        'paste.app_factory': [
-            'proxy=swift.proxy.server:app_factory',
-            'object=swift.obj.server:app_factory',
-            'container=swift.container.server:app_factory',
-            'account=swift.account.server:app_factory',
-        ],
-        'paste.filter_factory': [
-            'healthcheck=swift.common.middleware.healthcheck:filter_factory',
-            'memcache=swift.common.middleware.memcache:filter_factory',
-            'ratelimit=swift.common.middleware.ratelimit:filter_factory',
-            'cname_lookup=swift.common.middleware.cname_lookup:filter_factory',
-            'catch_errors=swift.common.middleware.catch_errors:filter_factory',
-            'domain_remap=swift.common.middleware.domain_remap:filter_factory',
-            'staticweb=swift.common.middleware.staticweb:filter_factory',
-            'tempauth=swift.common.middleware.tempauth:filter_factory',
-            'keystoneauth=swift.common.middleware.keystoneauth:filter_factory',
-            'recon=swift.common.middleware.recon:filter_factory',
-            'tempurl=swift.common.middleware.tempurl:filter_factory',
-            'formpost=swift.common.middleware.formpost:filter_factory',
-            'name_check=swift.common.middleware.name_check:filter_factory',
-            'proxy_logging=swift.common.middleware.proxy_logging:'
-            'filter_factory',
-        ],
-    },
-)
+setuptools.setup(
+    setup_requires=['pbr'],
+    pbr=True)
diff --git a/swift/__init__.py b/swift/__init__.py
index b8dc14e47b..280a902e39 100644
--- a/swift/__init__.py
+++ b/swift/__init__.py
@@ -1,21 +1,55 @@
-import gettext
+# Copyright (c) 2013 Hewlett-Packard Development Company, L.P.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+# implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
 
+import warnings
 
-class Version(object):
-    def __init__(self, canonical_version, final):
-        self.canonical_version = canonical_version
-        self.final = final
+__version__ = None
 
-    @property
-    def pretty_version(self):
-        if self.final:
-            return self.canonical_version
-        else:
-            return '%s-dev' % (self.canonical_version,)
+# First, try to get our version out of PKG-INFO. If we're installed,
+# this'll let us find our version without pulling in pbr. After all, if
+# we're installed on a system, we're not in a Git-managed source tree, so
+# pbr doesn't really buy us anything.
+try:
+    import importlib.metadata
+except ImportError:
+    # python < 3.8
+    import pkg_resources
+    try:
+        __version__ = __canonical_version__ = pkg_resources.get_provider(
+            pkg_resources.Requirement.parse('swift')).version
+    except pkg_resources.DistributionNotFound:
+        pass
+else:
+    try:
+        __version__ = __canonical_version__ = importlib.metadata.distribution(
+            'swift').version
+    except importlib.metadata.PackageNotFoundError:
+        pass
 
+if __version__ is None:
+    # No PKG-INFO? We're probably running from a checkout, then. Let pbr do
+    # its thing to figure out a version number.
+    import pbr.version
+    _version_info = pbr.version.VersionInfo('swift')
+    __version__ = _version_info.release_string()
+    __canonical_version__ = _version_info.version_string()
 
-_version = Version('1.7.6', False)
-__version__ = _version.pretty_version
-__canonical_version__ = _version.canonical_version
 
-gettext.install('swift')
+warnings.filterwarnings('ignore', module='cryptography|OpenSSL', message=(
+    'Python 2 is no longer supported by the Python core team. '
+    'Support for it is now deprecated in cryptography'))
+warnings.filterwarnings('ignore', message=(
+    'Python 3.6 is no longer supported by the Python core team. '
+    'Therefore, support for it is deprecated in cryptography'))
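Once resolved by the logic above, the version is just a module attribute; a trivial usage sketch (the printed values are examples only)::

    import swift

    print(swift.__version__)            # e.g. '2.30.1.dev42' from a git checkout
    print(swift.__canonical_version__)  # e.g. '2.30.1'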
diff --git a/swift/account/auditor.py b/swift/account/auditor.py
index eeb73d8dfe..0b0799c5bc 100644
--- a/swift/account/auditor.py
+++ b/swift/account/auditor.py
@@ -1,4 +1,4 @@
-# Copyright (c) 2010-2012 OpenStack, LLC.
+# Copyright (c) 2010-2012 OpenStack Foundation
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
@@ -13,112 +13,46 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 
-import os
-import time
-from random import random
 
-import swift.common.db
-from swift.account import server as account_server
-from swift.common.db import AccountBroker
-from swift.common.utils import get_logger, audit_location_generator, \
-    config_true_value, dump_recon_cache
-from swift.common.daemon import Daemon
+from swift.account.backend import AccountBroker
+from swift.common.exceptions import InvalidAccountInfo
+from swift.common.daemon import run_daemon
+from swift.common.db_auditor import DatabaseAuditor
+from swift.common.utils import parse_options
 
-from eventlet import Timeout
 
-
-class AccountAuditor(Daemon):
+class AccountAuditor(DatabaseAuditor):
     """Audit accounts."""
 
-    def __init__(self, conf):
-        self.conf = conf
-        self.logger = get_logger(conf, log_route='account-auditor')
-        self.devices = conf.get('devices', '/srv/node')
-        self.mount_check = config_true_value(conf.get('mount_check', 'true'))
-        self.interval = int(conf.get('interval', 1800))
-        self.account_passes = 0
-        self.account_failures = 0
-        swift.common.db.DB_PREALLOCATION = \
-            config_true_value(conf.get('db_preallocation', 'f'))
-        self.recon_cache_path = conf.get('recon_cache_path',
-                                         '/var/cache/swift')
-        self.rcache = os.path.join(self.recon_cache_path, "account.recon")
-
-    def _one_audit_pass(self, reported):
-        all_locs = audit_location_generator(self.devices,
-                                            account_server.DATADIR,
-                                            mount_check=self.mount_check,
-                                            logger=self.logger)
-        for path, device, partition in all_locs:
-            self.account_audit(path)
-            if time.time() - reported >= 3600:  # once an hour
-                self.logger.info(_('Since %(time)s: Account audits: '
-                                   '%(passed)s passed audit,'
-                                   '%(failed)s failed audit'),
-                                 {'time': time.ctime(reported),
-                                 'passed': self.account_passes,
-                                 'failed': self.account_failures})
-                dump_recon_cache({'account_audits_since': reported,
-                                  'account_audits_passed': self.account_passes,
-                                  'account_audits_failed':
-                                  self.account_failures},
-                                 self.rcache, self.logger)
-                reported = time.time()
-                self.account_passes = 0
-                self.account_failures = 0
-        return reported
-
-    def run_forever(self, *args, **kwargs):
-        """Run the account audit until stopped."""
-        reported = time.time()
-        time.sleep(random() * self.interval)
-        while True:
-            self.logger.info(_('Begin account audit pass.'))
-            begin = time.time()
-            try:
-                reported = self._one_audit_pass(reported)
-            except (Exception, Timeout):
-                self.logger.increment('errors')
-                self.logger.exception(_('ERROR auditing'))
-            elapsed = time.time() - begin
-            if elapsed < self.interval:
-                time.sleep(self.interval - elapsed)
-            self.logger.info(
-                _('Account audit pass completed: %.02fs'), elapsed)
-            dump_recon_cache({'account_auditor_pass_completed': elapsed},
-                             self.rcache, self.logger)
-
-    def run_once(self, *args, **kwargs):
-        """Run the account audit once."""
-        self.logger.info(_('Begin account audit "once" mode'))
-        begin = reported = time.time()
-        self._one_audit_pass(reported)
-        elapsed = time.time() - begin
-        self.logger.info(
-            _('Account audit "once" mode completed: %.02fs'), elapsed)
-        dump_recon_cache({'account_auditor_pass_completed': elapsed},
-                         self.rcache, self.logger)
-
-    def account_audit(self, path):
-        """
-        Audits the given account path
-
-        :param path: the path to an account db
-        """
-        start_time = time.time()
-        try:
-            if not path.endswith('.db'):
-                return
-            broker = AccountBroker(path)
-            if not broker.is_deleted():
-                info = broker.get_info()
-                self.logger.increment('passes')
-                self.account_passes += 1
-                self.logger.debug(_('Audit passed for %s') % broker.db_file)
-        except (Exception, Timeout):
-            self.logger.increment('failures')
-            self.account_failures += 1
-            self.logger.exception(_('ERROR Could not get account info %s'),
-                                  (broker.db_file))
-        self.logger.timing_since('timing', start_time)
+    server_type = "account"
+    broker_class = AccountBroker
+
+    def _audit(self, info, broker):
+        # Validate per policy counts
+        policy_stats = broker.get_policy_stats(do_migrations=True)
+        policy_totals = {
+            'container_count': 0,
+            'object_count': 0,
+            'bytes_used': 0,
+        }
+        for policy_stat in policy_stats.values():
+            for key in policy_totals:
+                policy_totals[key] += policy_stat[key]
+
+        for key in policy_totals:
+            if policy_totals[key] == info[key]:
+                continue
+            return InvalidAccountInfo(
+                'The total %(key)s for the account %(account)s (%(total)s) '
+                'does not match the sum of %(key)s across policies (%(sum)s)'
+                % {'key': key, 'account': info.get('account'),
+                   'total': info[key], 'sum': policy_totals[key]})
+
+
+def main():
+    conf_file, options = parse_options(once=True)
+    run_daemon(AccountAuditor, conf_file, **options)
+
+
+if __name__ == '__main__':
+    main()
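Besides the swift-account-auditor console script wired up in setup.cfg, the auditor can be driven programmatically; a minimal sketch, assuming a standard account-server config with an [account-auditor] section at a hypothetical path::

    from swift.account.auditor import AccountAuditor
    from swift.common.utils import readconf

    conf = readconf('/etc/swift/account-server.conf', 'account-auditor')
    AccountAuditor(conf).run_once()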
diff --git a/swift/account/backend.py b/swift/account/backend.py
new file mode 100644
index 0000000000..fc8201cb0b
--- /dev/null
+++ b/swift/account/backend.py
@@ -0,0 +1,662 @@
+# Copyright (c) 2010-2012 OpenStack Foundation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+"""
+Pluggable Back-end for Account Server
+"""
+
+
+import sqlite3
+
+from swift.common.utils import Timestamp, RESERVED_BYTE
+from swift.common.db import DatabaseBroker, zero_like
+
+DATADIR = 'accounts'
+
+
+POLICY_STAT_TRIGGER_SCRIPT = """
+    CREATE TRIGGER container_insert_ps AFTER INSERT ON container
+    BEGIN
+        INSERT OR IGNORE INTO policy_stat
+            (storage_policy_index, container_count, object_count, bytes_used)
+            VALUES (new.storage_policy_index, 0, 0, 0);
+        UPDATE policy_stat
+        SET container_count = container_count + (1 - new.deleted),
+            object_count = object_count + new.object_count,
+            bytes_used = bytes_used + new.bytes_used
+        WHERE storage_policy_index = new.storage_policy_index;
+    END;
+    CREATE TRIGGER container_delete_ps AFTER DELETE ON container
+    BEGIN
+        UPDATE policy_stat
+        SET container_count = container_count - (1 - old.deleted),
+            object_count = object_count - old.object_count,
+            bytes_used = bytes_used - old.bytes_used
+        WHERE storage_policy_index = old.storage_policy_index;
+    END;
+
+"""
+
+
+class AccountBroker(DatabaseBroker):
+    """Encapsulates working with an account database."""
+    db_type = 'account'
+    db_contains_type = 'container'
+    db_reclaim_timestamp = 'delete_timestamp'
+
+    def _initialize(self, conn, put_timestamp, **kwargs):
+        """
+        Create a brand new account database (tables, indices, triggers, etc.)
+
+        :param conn: DB connection object
+        :param put_timestamp: put timestamp
+        """
+        if not self.account:
+            raise ValueError(
+                'Attempting to create a new database with no account set')
+        self.create_container_table(conn)
+        self.create_account_stat_table(conn, put_timestamp)
+        self.create_policy_stat_table(conn)
+
+    def create_container_table(self, conn):
+        """
+        Create container table which is specific to the account DB.
+
+        :param conn: DB connection object
+        """
+        conn.executescript("""
+            CREATE TABLE container (
+                ROWID INTEGER PRIMARY KEY AUTOINCREMENT,
+                name TEXT,
+                put_timestamp TEXT,
+                delete_timestamp TEXT,
+                object_count INTEGER,
+                bytes_used INTEGER,
+                deleted INTEGER DEFAULT 0,
+                storage_policy_index INTEGER DEFAULT 0
+            );
+
+            CREATE INDEX ix_container_deleted_name ON
+                container (deleted, name);
+
+            CREATE TRIGGER container_insert AFTER INSERT ON container
+            BEGIN
+                UPDATE account_stat
+                SET container_count = container_count + (1 - new.deleted),
+                    object_count = object_count + new.object_count,
+                    bytes_used = bytes_used + new.bytes_used,
+                    hash = chexor(hash, new.name,
+                                  new.put_timestamp || '-' ||
+                                    new.delete_timestamp || '-' ||
+                                    new.object_count || '-' || new.bytes_used);
+            END;
+
+            CREATE TRIGGER container_update BEFORE UPDATE ON container
+            BEGIN
+                SELECT RAISE(FAIL, 'UPDATE not allowed; DELETE and INSERT');
+            END;
+
+
+            CREATE TRIGGER container_delete AFTER DELETE ON container
+            BEGIN
+                UPDATE account_stat
+                SET container_count = container_count - (1 - old.deleted),
+                    object_count = object_count - old.object_count,
+                    bytes_used = bytes_used - old.bytes_used,
+                    hash = chexor(hash, old.name,
+                                  old.put_timestamp || '-' ||
+                                    old.delete_timestamp || '-' ||
+                                    old.object_count || '-' || old.bytes_used);
+            END;
+        """ + POLICY_STAT_TRIGGER_SCRIPT)
+
+    def create_account_stat_table(self, conn, put_timestamp):
+        """
+        Create account_stat table which is specific to the account DB.
+        Not a part of Pluggable Back-ends, internal to the baseline code.
+
+        :param conn: DB connection object
+        :param put_timestamp: put timestamp
+        """
+        conn.executescript("""
+            CREATE TABLE account_stat (
+                account TEXT,
+                created_at TEXT,
+                put_timestamp TEXT DEFAULT '0',
+                delete_timestamp TEXT DEFAULT '0',
+                container_count INTEGER,
+                object_count INTEGER DEFAULT 0,
+                bytes_used INTEGER DEFAULT 0,
+                hash TEXT default '00000000000000000000000000000000',
+                id TEXT,
+                status TEXT DEFAULT '',
+                status_changed_at TEXT DEFAULT '0',
+                metadata TEXT DEFAULT ''
+            );
+
+            INSERT INTO account_stat (container_count) VALUES (0);
+        """)
+
+        conn.execute('''
+            UPDATE account_stat SET account = ?, created_at = ?, id = ?,
+                   put_timestamp = ?, status_changed_at = ?
+            ''', (self.account, Timestamp.now().internal, self._new_db_id(),
+                  put_timestamp, put_timestamp))
+
+    def create_policy_stat_table(self, conn):
+        """
+        Create policy_stat table which is specific to the account DB.
+        Not a part of Pluggable Back-ends, internal to the baseline code.
+
+        :param conn: DB connection object
+        """
+        conn.executescript("""
+            CREATE TABLE policy_stat (
+                storage_policy_index INTEGER PRIMARY KEY,
+                container_count INTEGER DEFAULT 0,
+                object_count INTEGER DEFAULT 0,
+                bytes_used INTEGER DEFAULT 0
+            );
+            INSERT OR IGNORE INTO policy_stat (
+                storage_policy_index, container_count, object_count,
+                bytes_used
+            )
+            SELECT 0, container_count, object_count, bytes_used
+            FROM account_stat
+            WHERE container_count > 0;
+        """)
+
+    def get_db_version(self, conn):
+        if self._db_version == -1:
+            self._db_version = 0
+            for row in conn.execute('''
+                    SELECT name FROM sqlite_master
+                    WHERE name = 'ix_container_deleted_name' '''):
+                self._db_version = 1
+        return self._db_version
+
+    def _commit_puts_load(self, item_list, entry):
+        """See :func:`swift.common.db.DatabaseBroker._commit_puts_load`"""
+        # check to see if the update includes policy_index or not
+        (name, put_timestamp, delete_timestamp, object_count, bytes_used,
+         deleted) = entry[:6]
+        if len(entry) > 6:
+            storage_policy_index = entry[6]
+        else:
+            # legacy support during upgrade until first non legacy storage
+            # policy is defined
+            storage_policy_index = 0
+        item_list.append(
+            {'name': name,
+             'put_timestamp': put_timestamp,
+             'delete_timestamp': delete_timestamp,
+             'object_count': object_count,
+             'bytes_used': bytes_used,
+             'deleted': deleted,
+             'storage_policy_index': storage_policy_index})
+
+    def empty(self):
+        """
+        Check if the account DB is empty.
+
+        :returns: True if the database has no active containers.
+        """
+        self._commit_puts_stale_ok()
+        with self.get() as conn:
+            row = conn.execute(
+                'SELECT container_count from account_stat').fetchone()
+            return zero_like(row[0])
+
+    def make_tuple_for_pickle(self, record):
+        return (record['name'], record['put_timestamp'],
+                record['delete_timestamp'], record['object_count'],
+                record['bytes_used'], record['deleted'],
+                record['storage_policy_index'])
+
+    def put_container(self, name, put_timestamp, delete_timestamp,
+                      object_count, bytes_used, storage_policy_index):
+        """
+        Create a container with the given attributes.
+
+        :param name: name of the container to create (a native string)
+        :param put_timestamp: put_timestamp of the container to create
+        :param delete_timestamp: delete_timestamp of the container to create
+        :param object_count: number of objects in the container
+        :param bytes_used: number of bytes used by the container
+        :param storage_policy_index:  the storage policy for this container
+        """
+        if Timestamp(delete_timestamp) > Timestamp(put_timestamp) and \
+                zero_like(object_count):
+            deleted = 1
+        else:
+            deleted = 0
+        record = {'name': name, 'put_timestamp': put_timestamp,
+                  'delete_timestamp': delete_timestamp,
+                  'object_count': object_count,
+                  'bytes_used': bytes_used,
+                  'deleted': deleted,
+                  'storage_policy_index': storage_policy_index}
+        self.put_record(record)
+
+    def _is_deleted_info(self, status, container_count, delete_timestamp,
+                         put_timestamp):
+        """
+        Apply delete logic to database info.
+
+        :returns: True if the DB is considered to be deleted, False otherwise
+        """
+        return status == 'DELETED' or zero_like(container_count) and (
+            Timestamp(delete_timestamp) > Timestamp(put_timestamp))
+
+    def _is_deleted(self, conn):
+        """
+        Check account_stat table and evaluate info.
+
+        :param conn: database conn
+
+        :returns: True if the DB is considered to be deleted, False otherwise
+        """
+        info = conn.execute('''
+            SELECT put_timestamp, delete_timestamp, container_count, status
+            FROM account_stat''').fetchone()
+        return self._is_deleted_info(**info)
+
+    def is_status_deleted(self):
+        """Only returns true if the status field is set to DELETED."""
+        with self.get() as conn:
+            row = conn.execute('''
+                SELECT put_timestamp, delete_timestamp, status
+                FROM account_stat''').fetchone()
+            return row['status'] == "DELETED" or (
+                row['delete_timestamp'] > row['put_timestamp'])
+
+    def get_policy_stats(self, do_migrations=False):
+        """
+        Get global policy stats for the account.
+
+        :param do_migrations: boolean, if True the policy stat dicts will
+                              always include the 'container_count' key;
+                              otherwise it may be omitted on legacy databases
+                              until they are migrated.
+
+        :returns: dict of policy stats where the key is the policy index and
+                  the value is a dictionary like {'object_count': M,
+                  'bytes_used': N, 'container_count': L}
+        """
+        columns = [
+            'storage_policy_index',
+            'container_count',
+            'object_count',
+            'bytes_used',
+        ]
+
+        def run_query():
+            return (conn.execute('''
+                SELECT %s
+                FROM policy_stat
+                ''' % ', '.join(columns)).fetchall())
+
+        self._commit_puts_stale_ok()
+        info = []
+        with self.get() as conn:
+            try:
+                info = run_query()
+            except sqlite3.OperationalError as err:
+                if "no such column: container_count" in str(err):
+                    if do_migrations:
+                        self._migrate_add_container_count(conn)
+                    else:
+                        columns.remove('container_count')
+                    info = run_query()
+                elif "no such table: policy_stat" in str(err):
+                    if do_migrations:
+                        self.create_policy_stat_table(conn)
+                        info = run_query()
+                    # else, pass and let the results be empty
+                else:
+                    raise
+
+        policy_stats = {}
+        for row in info:
+            stats = dict(row)
+            key = stats.pop('storage_policy_index')
+            policy_stats[key] = stats
+        return policy_stats
+
+    def get_info(self):
+        """
+        Get global data for the account.
+
+        :returns: dict with keys: account, created_at, put_timestamp,
+                  delete_timestamp, status_changed_at, container_count,
+                  object_count, bytes_used, hash, id
+        """
+        self._commit_puts_stale_ok()
+        with self.get() as conn:
+            data = dict(conn.execute('''
+                SELECT account, created_at, put_timestamp, delete_timestamp,
+                       status_changed_at, container_count, object_count,
+                       bytes_used, hash, id
+                FROM account_stat
+            ''').fetchone())
+        self.account = data['account']
+        return data
+
+    def _populate_instance_cache(self):
+        """
+        Lazily populate self.account (used for logging and other
+        read-mostly paths) by loading the account info on first use;
+        `self.account is None` is the only indicator that it has not
+        been populated yet.
+        """
+        if self.account is None:
+            self.get_info()
+
+    @property
+    def path(self):
+        """
+        Logical namespace path used for logging.
+
+        For AccountBroker this is just the account name; there is no
+        container component.
+        """
+        self._populate_instance_cache()
+        return self.account
+
+    def list_containers_iter(self, limit, marker, end_marker, prefix,
+                             delimiter, reverse=False, allow_reserved=False):
+        """
+        Get a list of containers sorted by name starting at marker onward, up
+        to limit entries. Entries will begin with the prefix and will not have
+        the delimiter after the prefix.
+
+        :param limit: maximum number of entries to get
+        :param marker: marker query
+        :param end_marker: end marker query
+        :param prefix: prefix query
+        :param delimiter: delimiter for query
+        :param reverse: reverse the result order.
+        :param allow_reserved: if True, include names containing the
+                               reserved byte; they are excluded by default
+
+        :returns: list of tuples of (name, object_count, bytes_used,
+                  put_timestamp, storage_policy_index, is_subdir)
+        """
+        delim_force_gte = False
+        if reverse:
+            # Reverse the markers if we are reversing the listing.
+            marker, end_marker = end_marker, marker
+        self._commit_puts_stale_ok()
+        if delimiter and not prefix:
+            prefix = ''
+        if prefix:
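+            # end_prefix is an exclusive upper bound for names beginning
+            # with prefix (e.g. prefix 'abc' -> 'abd'), used below to
+            # bound the SQL range scan.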
+            end_prefix = prefix[:-1] + chr(ord(prefix[-1]) + 1)
+        orig_marker = marker
+        with self.get() as conn:
+            results = []
+            while len(results) < limit:
+                query = """
+                    SELECT name, object_count, bytes_used, put_timestamp,
+                    {storage_policy_index}, 0
+                    FROM container
+                    WHERE """
+                query_args = []
+                if end_marker and (not prefix or end_marker < end_prefix):
+                    query += ' name < ? AND'
+                    query_args.append(end_marker)
+                elif prefix:
+                    query += ' name < ? AND'
+                    query_args.append(end_prefix)
+
+                if delim_force_gte:
+                    query += ' name >= ? AND'
+                    query_args.append(marker)
+                    # Always set back to False
+                    delim_force_gte = False
+                elif marker and (not prefix or marker >= prefix):
+                    query += ' name > ? AND'
+                    query_args.append(marker)
+                elif prefix:
+                    query += ' name >= ? AND'
+                    query_args.append(prefix)
+                if not allow_reserved:
+                    query += ' name >= ? AND'
+                    query_args.append(chr(ord(RESERVED_BYTE) + 1))
+                if self.get_db_version(conn) < 1:
+                    query += ' +deleted = 0'
+                else:
+                    query += ' deleted = 0'
+                query += ' ORDER BY name %s LIMIT ?' % \
+                         ('DESC' if reverse else '')
+                query_args.append(limit - len(results))
+                try:
+                    # First, try querying with the storage policy index.
+                    curs = conn.execute(
+                        query.format(
+                            storage_policy_index="storage_policy_index"),
+                        query_args)
+                except sqlite3.OperationalError as err:
+                    # If the storage policy column is not available,
+                    # the database has not been migrated to the new schema
+                    # with storage_policy_index. Re-run the query with
+                    # storage_policy_index set to 0, which is what
+                    # would be set once the database is migrated.
+                    # TODO(callumdickinson): If support for migrating
+                    # pre-storage policy versions of Swift is dropped,
+                    # then this special handling can be removed.
+                    if "no such column: storage_policy_index" in str(err):
+                        curs = conn.execute(
+                            query.format(storage_policy_index="0"),
+                            query_args)
+                    else:
+                        raise
+                curs.row_factory = None
+
+                # A delimiter is only honoured together with a prefix (an
+                # empty prefix was substituted above if needed); if there
+                # is no delimiter we can simply return the results, since
+                # prefixes are already handled in the SQL statement.
+                if prefix is None or not delimiter:
+                    return [r for r in curs]
+
+                # We have a delimiter and a prefix (possibly empty string) to
+                # handle
+                rowcount = 0
+                for row in curs:
+                    rowcount += 1
+                    name = row[0]
+                    if reverse:
+                        end_marker = name
+                    else:
+                        marker = name
+
+                    if len(results) >= limit:
+                        curs.close()
+                        return results
+                    end = name.find(delimiter, len(prefix))
+                    if end >= 0:
+                        if reverse:
+                            end_marker = name[:end + len(delimiter)]
+                        else:
+                            marker = ''.join([
+                                name[:end],
+                                delimiter[:-1],
+                                chr(ord(delimiter[-1:]) + 1),
+                            ])
+                            # we want result to be inclusive of delim+1
+                            delim_force_gte = True
+                        dir_name = name[:end + len(delimiter)]
+                        if dir_name != orig_marker:
+                            results.append([dir_name, 0, 0, '0', -1, 1])
+                        curs.close()
+                        break
+                    results.append(row)
+                if not rowcount:
+                    break
+            return results
+
+    def merge_items(self, item_list, source=None):
+        """
+        Merge items into the container table.
+
+        :param item_list: list of dictionaries of {'name', 'put_timestamp',
+                          'delete_timestamp', 'object_count', 'bytes_used',
+                          'deleted', 'storage_policy_index'}
+        :param source: if defined, update incoming_sync with the source
+        """
+        def _really_merge_items(conn):
+            max_rowid = -1
+            curs = conn.cursor()
+            for rec in item_list:
+                rec.setdefault('storage_policy_index', 0)  # legacy
+                record = [rec['name'], rec['put_timestamp'],
+                          rec['delete_timestamp'], rec['object_count'],
+                          rec['bytes_used'], rec['deleted'],
+                          rec['storage_policy_index']]
+                query = '''
+                    SELECT name, put_timestamp, delete_timestamp,
+                           object_count, bytes_used, deleted,
+                           storage_policy_index
+                    FROM container WHERE name = ?
+                '''
+                if self.get_db_version(conn) >= 1:
+                    query += ' AND deleted IN (0, 1)'
+                curs_row = curs.execute(query, (rec['name'],))
+                curs_row.row_factory = None
+                row = curs_row.fetchone()
+                if row:
+                    row = list(row)
+                    for i in range(5):
+                        if record[i] is None and row[i] is not None:
+                            record[i] = row[i]
+                    if Timestamp(row[1]) > \
+                       Timestamp(record[1]):  # Keep newest put_timestamp
+                        record[1] = row[1]
+                    if Timestamp(row[2]) > \
+                       Timestamp(record[2]):  # Keep newest delete_timestamp
+                        record[2] = row[2]
+                    # If deleted, mark as such
+                    if Timestamp(record[2]) > Timestamp(record[1]) and \
+                            zero_like(record[3]):
+                        record[5] = 1
+                    else:
+                        record[5] = 0
+                curs.execute('''
+                    DELETE FROM container WHERE name = ? AND
+                                                deleted IN (0, 1)
+                ''', (record[0],))
+                curs.execute('''
+                    INSERT INTO container (name, put_timestamp,
+                        delete_timestamp, object_count, bytes_used,
+                        deleted, storage_policy_index)
+                    VALUES (?, ?, ?, ?, ?, ?, ?)
+                ''', record)
+                if source:
+                    max_rowid = max(max_rowid, rec['ROWID'])
+            if source:
+                try:
+                    curs.execute('''
+                        INSERT INTO incoming_sync (sync_point, remote_id)
+                        VALUES (?, ?)
+                    ''', (max_rowid, source))
+                except sqlite3.IntegrityError:
+                    curs.execute('''
+                        UPDATE incoming_sync
+                        SET sync_point=max(?, sync_point)
+                        WHERE remote_id=?
+                    ''', (max_rowid, source))
+            conn.commit()
+
+        with self.get() as conn:
+            # create the policy stat table if needed and add spi to container
+            try:
+                _really_merge_items(conn)
+            except sqlite3.OperationalError as err:
+                if 'no such column: storage_policy_index' not in str(err):
+                    raise
+                self._migrate_add_storage_policy_index(conn)
+                _really_merge_items(conn)
+
+    def _migrate_add_container_count(self, conn):
+        """
+        Add the container_count column to the 'policy_stat' table and
+        update it
+
+        :param conn: DB connection object
+        """
+        # add the container_count column
+        curs = conn.cursor()
+        curs.executescript('''
+            DROP TRIGGER container_delete_ps;
+            DROP TRIGGER container_insert_ps;
+            ALTER TABLE policy_stat
+            ADD COLUMN container_count INTEGER DEFAULT 0;
+        ''' + POLICY_STAT_TRIGGER_SCRIPT)
+
+        # Keep the simple case simple: if there's only one entry in the
+        # policy_stat table, just copy the total container count from the
+        # account_stat table.
+
+        # If that UPDATE changed a row, changes() is non-zero, so the WHERE
+        # NOT EXISTS guard below fails and the INSERT OR REPLACE driven by
+        # the per-policy count subquery does not execute.
+
+        curs.executescript("""
+        UPDATE policy_stat
+        SET container_count = (
+            SELECT container_count
+            FROM account_stat)
+        WHERE (
+            SELECT COUNT(storage_policy_index)
+            FROM policy_stat
+        ) <= 1;
+
+        INSERT OR REPLACE INTO policy_stat (
+            storage_policy_index,
+            container_count,
+            object_count,
+            bytes_used
+        )
+        SELECT p.storage_policy_index,
+               c.count,
+               p.object_count,
+               p.bytes_used
+        FROM (
+            SELECT storage_policy_index,
+                   COUNT(*) as count
+            FROM container
+            WHERE deleted = 0
+            GROUP BY storage_policy_index
+        ) c
+        JOIN policy_stat p
+        ON p.storage_policy_index = c.storage_policy_index
+        WHERE NOT EXISTS(
+            SELECT changes() as change
+            FROM policy_stat
+            WHERE change <> 0
+        );
+        """)
+        conn.commit()
+
+    def _migrate_add_storage_policy_index(self, conn):
+        """
+        Add the storage_policy_index column to the 'container' table and
+        set up triggers, creating the policy_stat table if needed.
+
+        :param conn: DB connection object
+        """
+        try:
+            self.create_policy_stat_table(conn)
+        except sqlite3.OperationalError as err:
+            if 'table policy_stat already exists' not in str(err):
+                raise
+        conn.executescript('''
+            ALTER TABLE container
+            ADD COLUMN storage_policy_index INTEGER DEFAULT 0;
+        ''' + POLICY_STAT_TRIGGER_SCRIPT)
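
A minimal sketch of how the AccountBroker API added above fits together (illustrative only, not part of the patch). It assumes a Swift development checkout where swift is importable; the database path, account name, and container name are made up, and initialize() comes from the DatabaseBroker base class.

    # Sketch: exercise the new account backend schema end to end.
    from swift.account.backend import AccountBroker
    from swift.common.utils import Timestamp

    broker = AccountBroker('/tmp/AUTH_test.db', account='AUTH_test')
    broker.initialize(Timestamp.now().internal)

    # Record one container holding 3 objects / 1024 bytes in policy 0.
    broker.put_container('photos', Timestamp.now().internal, '0', 3, 1024, 0)

    # Listing rows are (name, object_count, bytes_used, put_timestamp,
    # storage_policy_index, is_subdir), as documented on
    # list_containers_iter() above.
    for name, objs, used, put_ts, spi, is_subdir in \
            broker.list_containers_iter(100, '', None, None, None):
        print(name, objs, used, spi)

    # Per-policy rollups that back the account server's response headers.
    print(broker.get_policy_stats())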
diff --git a/swift/account/reaper.py b/swift/account/reaper.py
index 385d95275e..0061e790ac 100644
--- a/swift/account/reaper.py
+++ b/swift/account/reaper.py
@@ -1,4 +1,4 @@
-# Copyright (c) 2010-2012 OpenStack, LLC.
+# Copyright (c) 2010-2012 OpenStack Foundation
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
@@ -15,20 +15,28 @@
 
 import os
 import random
+import socket
 from logging import DEBUG
 from math import sqrt
 from time import time
+import itertools
 
 from eventlet import GreenPool, sleep, Timeout
 
 import swift.common.db
-from swift.account.server import DATADIR
-from swift.common.db import AccountBroker
-from swift.common.direct_client import ClientException, \
-    direct_delete_container, direct_delete_object, direct_get_container
+from swift.account.backend import AccountBroker, DATADIR
+from swift.common.constraints import check_drive
+from swift.common.daemon import run_daemon
+from swift.common.direct_client import direct_delete_container, \
+    direct_delete_object, direct_get_container
+from swift.common.exceptions import ClientException
+from swift.common.request_helpers import USE_REPLICATION_NETWORK_HEADER
 from swift.common.ring import Ring
-from swift.common.utils import get_logger, whataremyips, config_true_value
+from swift.common.ring.utils import is_local_device
+from swift.common.utils import get_logger, whataremyips, config_true_value, \
+    Timestamp, md5, node_to_string, parse_options
 from swift.common.daemon import Daemon
+from swift.common.storage_policy import POLICIES, PolicyError
 
 
 class AccountReaper(Daemon):
@@ -52,19 +60,20 @@ class AccountReaper(Daemon):
     configuration parameters.
     """
 
-    def __init__(self, conf):
+    def __init__(self, conf, logger=None):
         self.conf = conf
-        self.logger = get_logger(conf, log_route='account-reaper')
+        self.logger = logger or get_logger(conf, log_route='account-reaper')
         self.devices = conf.get('devices', '/srv/node')
         self.mount_check = config_true_value(conf.get('mount_check', 'true'))
-        self.interval = int(conf.get('interval', 3600))
+        self.interval = float(conf.get('interval', 3600))
         self.swift_dir = conf.get('swift_dir', '/etc/swift')
         self.account_ring = None
         self.container_ring = None
         self.object_ring = None
-        self.node_timeout = int(conf.get('node_timeout', 10))
+        self.node_timeout = float(conf.get('node_timeout', 10))
         self.conn_timeout = float(conf.get('conn_timeout', 0.5))
-        self.myips = whataremyips()
+        self.myips = whataremyips(conf.get('bind_ip', '0.0.0.0'))
+        self.bind_port = int(conf.get('bind_port', 6202))
         self.concurrency = int(conf.get('concurrency', 25))
         self.container_concurrency = self.object_concurrency = \
             sqrt(self.concurrency)
@@ -72,32 +81,39 @@ def __init__(self, conf):
         swift.common.db.DB_PREALLOCATION = \
             config_true_value(conf.get('db_preallocation', 'f'))
         self.delay_reaping = int(conf.get('delay_reaping') or 0)
+        reap_warn_after = float(conf.get('reap_warn_after') or 86400 * 30)
+        self.reap_not_done_after = reap_warn_after + self.delay_reaping
+        self.start_time = time()
+        self.reset_stats()
 
     def get_account_ring(self):
-        """ The account :class:`swift.common.ring.Ring` for the cluster. """
+        """The account :class:`swift.common.ring.Ring` for the cluster."""
         if not self.account_ring:
             self.account_ring = Ring(self.swift_dir, ring_name='account')
         return self.account_ring
 
     def get_container_ring(self):
-        """ The container :class:`swift.common.ring.Ring` for the cluster. """
+        """The container :class:`swift.common.ring.Ring` for the cluster."""
         if not self.container_ring:
             self.container_ring = Ring(self.swift_dir, ring_name='container')
         return self.container_ring
 
-    def get_object_ring(self):
-        """ The object :class:`swift.common.ring.Ring` for the cluster. """
-        if not self.object_ring:
-            self.object_ring = Ring(self.swift_dir, ring_name='object')
-        return self.object_ring
+    def get_object_ring(self, policy_idx):
+        """
+        Get the ring identified by the policy index
 
-    def run_forever(self, *args, **kwargs):
+        :param policy_idx: Storage policy index
+        :returns: A ring matching the storage policy
         """
-        Main entry point when running the reaper in its normal daemon mode.
-        This repeatedly calls :func:`reap_once` no quicker than the
+        return POLICIES.get_object_ring(policy_idx, self.swift_dir)
+
+    def run_forever(self, *args, **kwargs):
+        """Main entry point when running the reaper in normal daemon mode.
+
+        This repeatedly calls :func:`run_once` no quicker than the
         configuration interval.
         """
-        self.logger.debug(_('Daemon started.'))
+        self.logger.debug('Daemon started.')
         sleep(random.random() * self.interval)
         while True:
             begin = time()
@@ -113,22 +129,22 @@ def run_once(self, *args, **kwargs):
         repeatedly by :func:`run_forever`. This will call :func:`reap_device`
         once for each device on the server.
         """
-        self.logger.debug(_('Begin devices pass: %s'), self.devices)
+        self.logger.debug('Begin devices pass: %s', self.devices)
         begin = time()
         try:
             for device in os.listdir(self.devices):
-                if self.mount_check and not os.path.ismount(
-                        os.path.join(self.devices, device)):
+                try:
+                    check_drive(self.devices, device, self.mount_check)
+                except ValueError as err:
                     self.logger.increment('errors')
-                    self.logger.debug(
-                        _('Skipping %s as it is not mounted'), device)
+                    self.logger.debug('Skipping: %s', err)
                     continue
                 self.reap_device(device)
         except (Exception, Timeout):
-            self.logger.exception(_("Exception in top-level account reaper "
-                                    "loop"))
+            self.logger.exception("Exception in top-level account reaper "
+                                  "loop")
         elapsed = time() - begin
-        self.logger.info(_('Devices pass completed: %.02fs'), elapsed)
+        self.logger.info('Devices pass completed: %.02fs', elapsed)
 
     def reap_device(self, device):
         """
@@ -151,9 +167,18 @@ def reap_device(self, device):
             if not partition.isdigit():
                 continue
             nodes = self.get_account_ring().get_part_nodes(int(partition))
-            if nodes[0]['ip'] not in self.myips or \
-                    not os.path.isdir(partition_path):
+            if not os.path.isdir(partition_path):
                 continue
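+            # Find this server's position among the partition's primary
+            # nodes; the for/else skips partitions we are not a primary
+            # for, and the matching index becomes our container shard.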
+            container_shard = None
+            for container_shard, node in enumerate(nodes):
+                if is_local_device(self.myips, None, node['ip'], None) and \
+                        (not self.bind_port or
+                         self.bind_port == node['port']) and \
+                        (device == node['device']):
+                    break
+            else:
+                continue
+
             for suffix in os.listdir(partition_path):
                 suffix_path = os.path.join(partition_path, suffix)
                 if not os.path.isdir(suffix_path):
@@ -168,12 +193,24 @@ def reap_device(self, device):
                         elif fname.endswith('.db'):
                             self.start_time = time()
                             broker = \
-                                AccountBroker(os.path.join(hsh_path, fname))
+                                AccountBroker(os.path.join(hsh_path, fname),
+                                              logger=self.logger)
                             if broker.is_status_deleted() and \
                                     not broker.empty():
-                                self.reap_account(broker, partition, nodes)
+                                self.reap_account(
+                                    broker, partition, nodes,
+                                    container_shard=container_shard)
 
-    def reap_account(self, broker, partition, nodes):
+    def reset_stats(self):
+        self.stats_return_codes = {}
+        self.stats_containers_deleted = 0
+        self.stats_objects_deleted = 0
+        self.stats_containers_remaining = 0
+        self.stats_objects_remaining = 0
+        self.stats_containers_possibly_remaining = 0
+        self.stats_objects_possibly_remaining = 0
+
+    def reap_account(self, broker, partition, nodes, container_shard=None):
         """
         Called once per pass for each account this server is the primary for
         and attempts to delete the data for the given account. The reaper will
@@ -200,10 +237,12 @@ def reap_account(self, broker, partition, nodes):
         :param broker: The AccountBroker for the account to delete.
         :param partition: The partition in the account ring the account is on.
         :param nodes: The primary node dicts for the account to delete.
+        :param container_shard: int used to shard containers reaped. If None,
+                                will reap all containers.
 
         .. seealso::
 
-            :class:`swift.common.db.AccountBroker` for the broker class.
+            :class:`swift.account.backend.AccountBroker` for the broker class.
 
         .. seealso::
 
@@ -212,62 +251,74 @@ def reap_account(self, broker, partition, nodes):
         """
         begin = time()
         info = broker.get_info()
-        if time() - float(info['delete_timestamp']) <= self.delay_reaping:
+        if time() - float(Timestamp(info['delete_timestamp'])) <= \
+                self.delay_reaping:
             return False
         account = info['account']
-        self.logger.info(_('Beginning pass on account %s'), account)
-        self.stats_return_codes = {}
-        self.stats_containers_deleted = 0
-        self.stats_objects_deleted = 0
-        self.stats_containers_remaining = 0
-        self.stats_objects_remaining = 0
-        self.stats_containers_possibly_remaining = 0
-        self.stats_objects_possibly_remaining = 0
+        self.logger.info('Beginning pass on account %s', account)
+        self.reset_stats()
+        container_limit = 1000
+        if container_shard is not None:
+            container_limit *= len(nodes)
         try:
-            marker = ''
-            while True:
-                containers = \
-                    list(broker.list_containers_iter(1000, marker, None, None,
-                                                     None))
-                if not containers:
-                    break
+            containers = list(broker.list_containers_iter(
+                container_limit, '', None, None, None, allow_reserved=True))
+            while containers:
                 try:
-                    for (container, _junk, _junk, _junk) in containers:
+                    for row in containers:
+                        container = row[0]
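+                        # Spread containers across this account's primary
+                        # nodes: md5(name) picks a shard and only the
+                        # matching reaper deletes it (a container_shard of
+                        # None means reap everything).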
+                        this_shard = (
+                            int(md5(container.encode('utf-8'),
+                                    usedforsecurity=False)
+                                .hexdigest(), 16) % len(nodes))
+                        if container_shard not in (this_shard, None):
+                            continue
+
                         self.container_pool.spawn(self.reap_container, account,
                                                   partition, nodes, container)
                     self.container_pool.waitall()
                 except (Exception, Timeout):
                     self.logger.exception(
-                        _('Exception with containers for account %s'), account)
-                marker = containers[-1][0]
-            log = 'Completed pass on account %s' % account
+                        'Exception with containers for account %s', account)
+                containers = list(broker.list_containers_iter(
+                    container_limit, containers[-1][0], None, None, None,
+                    allow_reserved=True))
+            log_buf = ['Completed pass on account %s' % account]
         except (Exception, Timeout):
-            self.logger.exception(
-                _('Exception with account %s'), account)
-            log = _('Incomplete pass on account %s') % account
+            self.logger.exception('Exception with account %s', account)
+            log_buf = ['Incomplete pass on account %s' % account]
         if self.stats_containers_deleted:
-            log += _(', %s containers deleted') % self.stats_containers_deleted
+            log_buf.append(', %s containers deleted' %
+                           self.stats_containers_deleted)
         if self.stats_objects_deleted:
-            log += _(', %s objects deleted') % self.stats_objects_deleted
+            log_buf.append(', %s objects deleted' % self.stats_objects_deleted)
         if self.stats_containers_remaining:
-            log += _(', %s containers remaining') % \
-                self.stats_containers_remaining
+            log_buf.append(', %s containers remaining' %
+                           self.stats_containers_remaining)
         if self.stats_objects_remaining:
-            log += _(', %s objects remaining') % self.stats_objects_remaining
+            log_buf.append(', %s objects remaining' %
+                           self.stats_objects_remaining)
         if self.stats_containers_possibly_remaining:
-            log += _(', %s containers possibly remaining') % \
-                self.stats_containers_possibly_remaining
+            log_buf.append(', %s containers possibly remaining' %
+                           self.stats_containers_possibly_remaining)
         if self.stats_objects_possibly_remaining:
-            log += _(', %s objects possibly remaining') % \
-                self.stats_objects_possibly_remaining
+            log_buf.append(', %s objects possibly remaining' %
+                           self.stats_objects_possibly_remaining)
         if self.stats_return_codes:
-            log += _(', return codes: ')
-            for code in sorted(self.stats_return_codes.keys()):
-                log += '%s %sxxs, ' % (self.stats_return_codes[code], code)
-            log = log[:-2]
-        log += _(', elapsed: %.02fs') % (time() - begin)
-        self.logger.info(log)
+            log_buf.append(', return codes: ')
+            for code in sorted(self.stats_return_codes):
+                log_buf.append('%s %sxxs, ' % (self.stats_return_codes[code],
+                                               code))
+            log_buf[-1] = log_buf[-1][:-2]
+        log_buf.append(', elapsed: %.02fs' % (time() - begin))
+        self.logger.info(''.join(log_buf))
         self.logger.timing_since('timing', self.start_time)
+        delete_timestamp = Timestamp(info['delete_timestamp'])
+        if self.stats_containers_remaining and \
+           begin - float(delete_timestamp) >= self.reap_not_done_after:
+            self.logger.warning(
+                'Account %(account)s has not been reaped since %(time)s' %
+                {'account': account, 'time': delete_timestamp.isoformat})
         return True
 
     def reap_container(self, account, account_partition, account_nodes,
@@ -314,40 +365,47 @@ def reap_container(self, account, account_partition, account_nodes,
         while True:
             objects = None
             try:
-                objects = direct_get_container(
+                headers, objects = direct_get_container(
                     node, part, account, container,
                     marker=marker,
                     conn_timeout=self.conn_timeout,
-                    response_timeout=self.node_timeout)[1]
+                    response_timeout=self.node_timeout,
+                    headers={USE_REPLICATION_NETWORK_HEADER: 'true'})
                 self.stats_return_codes[2] = \
                     self.stats_return_codes.get(2, 0) + 1
                 self.logger.increment('return_codes.2')
-            except ClientException, err:
+            except ClientException as err:
                 if self.logger.getEffectiveLevel() <= DEBUG:
                     self.logger.exception(
-                        _('Exception with %(ip)s:%(port)s/%(device)s'), node)
-                self.stats_return_codes[err.http_status / 100] = \
-                    self.stats_return_codes.get(err.http_status / 100, 0) + 1
+                        'Exception with %s', node_to_string(node))
+                self.stats_return_codes[err.http_status // 100] = \
+                    self.stats_return_codes.get(err.http_status // 100, 0) + 1
                 self.logger.increment(
-                    'return_codes.%d' % (err.http_status / 100,))
+                    'return_codes.%d' % (err.http_status // 100,))
+            except (Timeout, socket.error):
+                self.logger.error(
+                    'Timeout Exception with %s', node_to_string(node))
             if not objects:
                 break
             try:
+                policy_index = headers.get('X-Backend-Storage-Policy-Index', 0)
+                policy = POLICIES.get_by_index(policy_index)
+                if not policy:
+                    self.logger.error('ERROR: invalid storage policy index: %r'
+                                      % policy_index)
                 for obj in objects:
-                    if isinstance(obj['name'], unicode):
-                        obj['name'] = obj['name'].encode('utf8')
                     pool.spawn(self.reap_object, account, container, part,
-                               nodes, obj['name'])
+                               nodes, obj['name'], policy_index)
                 pool.waitall()
             except (Exception, Timeout):
-                self.logger.exception(_('Exception with objects for container '
-                                        '%(container)s for account %(account)s'
-                                        ),
+                self.logger.exception('Exception with objects for container '
+                                      '%(container)s for account %(account)s',
                                       {'container': container,
                                        'account': account})
             marker = objects[-1]['name']
         successes = 0
         failures = 0
+        timestamp = Timestamp.now()
         for node in nodes:
             anode = account_nodes.pop()
             try:
@@ -358,21 +416,28 @@ def reap_container(self, account, account_partition, account_nodes,
                     headers={'X-Account-Host': '%(ip)s:%(port)s' % anode,
                              'X-Account-Partition': str(account_partition),
                              'X-Account-Device': anode['device'],
-                             'X-Account-Override-Deleted': 'yes'})
+                             'X-Account-Override-Deleted': 'yes',
+                             'X-Timestamp': timestamp.internal,
+                             USE_REPLICATION_NETWORK_HEADER: 'true'})
                 successes += 1
                 self.stats_return_codes[2] = \
                     self.stats_return_codes.get(2, 0) + 1
                 self.logger.increment('return_codes.2')
-            except ClientException, err:
+            except ClientException as err:
                 if self.logger.getEffectiveLevel() <= DEBUG:
                     self.logger.exception(
-                        _('Exception with %(ip)s:%(port)s/%(device)s'), node)
+                        'Exception with %s', node_to_string(node))
                 failures += 1
                 self.logger.increment('containers_failures')
-                self.stats_return_codes[err.http_status / 100] = \
-                    self.stats_return_codes.get(err.http_status / 100, 0) + 1
+                self.stats_return_codes[err.http_status // 100] = \
+                    self.stats_return_codes.get(err.http_status // 100, 0) + 1
                 self.logger.increment(
-                    'return_codes.%d' % (err.http_status / 100,))
+                    'return_codes.%d' % (err.http_status // 100,))
+            except (Timeout, socket.error):
+                self.logger.error(
+                    'Timeout Exception with %s', node_to_string(node))
+                failures += 1
+                self.logger.increment('containers_failures')
         if successes > failures:
             self.stats_containers_deleted += 1
             self.logger.increment('containers_deleted')
@@ -384,7 +449,7 @@ def reap_container(self, account, account_partition, account_nodes,
             self.logger.increment('containers_possibly_remaining')
 
     def reap_object(self, account, container, container_partition,
-                    container_nodes, obj):
+                    container_nodes, obj, policy_index):
         """
         Deletes the given object by issuing a delete request to each node for
         the object. The format of the delete request is such that each object
@@ -400,16 +465,25 @@ def reap_object(self, account, container, container_partition,
                                     container ring.
         :param container_nodes: The primary node dicts for the container.
         :param obj: The name of the object to delete.
+        :param policy_index: The storage policy index of the object's container
 
         * See also: :func:`swift.common.ring.Ring.get_nodes` for a description
           of the container node dicts.
         """
-        container_nodes = list(container_nodes)
-        part, nodes = self.get_object_ring().get_nodes(account, container, obj)
+        cnodes = itertools.cycle(container_nodes)
+        try:
+            ring = self.get_object_ring(policy_index)
+        except PolicyError:
+            self.stats_objects_remaining += 1
+            self.logger.increment('objects_remaining')
+            return
+        part, nodes = ring.get_nodes(account, container, obj)
         successes = 0
         failures = 0
+        timestamp = Timestamp.now()
+
         for node in nodes:
-            cnode = container_nodes.pop()
+            cnode = next(cnodes)
             try:
                 direct_delete_object(
                     node, part, account, container, obj,
@@ -417,21 +491,29 @@ def reap_object(self, account, container, container_partition,
                     response_timeout=self.node_timeout,
                     headers={'X-Container-Host': '%(ip)s:%(port)s' % cnode,
                              'X-Container-Partition': str(container_partition),
-                             'X-Container-Device': cnode['device']})
+                             'X-Container-Device': cnode['device'],
+                             'X-Backend-Storage-Policy-Index': policy_index,
+                             'X-Timestamp': timestamp.internal,
+                             USE_REPLICATION_NETWORK_HEADER: 'true'})
                 successes += 1
                 self.stats_return_codes[2] = \
                     self.stats_return_codes.get(2, 0) + 1
                 self.logger.increment('return_codes.2')
-            except ClientException, err:
+            except ClientException as err:
                 if self.logger.getEffectiveLevel() <= DEBUG:
                     self.logger.exception(
-                        _('Exception with %(ip)s:%(port)s/%(device)s'), node)
+                        'Exception with %s', node_to_string(node))
                 failures += 1
                 self.logger.increment('objects_failures')
-                self.stats_return_codes[err.http_status / 100] = \
-                    self.stats_return_codes.get(err.http_status / 100, 0) + 1
+                self.stats_return_codes[err.http_status // 100] = \
+                    self.stats_return_codes.get(err.http_status // 100, 0) + 1
                 self.logger.increment(
-                    'return_codes.%d' % (err.http_status / 100,))
+                    'return_codes.%d' % (err.http_status // 100,))
+            except (Timeout, socket.error):
+                failures += 1
+                self.logger.increment('objects_failures')
+                self.logger.error(
+                    'Timeout Exception with %s', node_to_string(node))
             if successes > failures:
                 self.stats_objects_deleted += 1
                 self.logger.increment('objects_deleted')
@@ -441,3 +523,12 @@ def reap_object(self, account, container, container_partition,
             else:
                 self.stats_objects_possibly_remaining += 1
                 self.logger.increment('objects_possibly_remaining')
+
+
+def main():
+    conf_file, options = parse_options(once=True)
+    run_daemon(AccountReaper, conf_file, **options)
+
+
+if __name__ == '__main__':
+    main()
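
The reap_account() change above splits a deleted account's containers across that account's primary nodes rather than having only the first primary do all the work. A standalone sketch of the mapping (illustrative only; the replica count of 3 and the container names are arbitrary examples):

    from swift.common.utils import md5

    def container_shard(container, replica_count):
        # Same hash used in reap_account(): a stable container -> node index.
        return int(md5(container.encode('utf-8'),
                       usedforsecurity=False).hexdigest(), 16) % replica_count

    for name in ('photos', 'backups', 'logs'):
        print('%s is reaped by primary #%d' % (name, container_shard(name, 3)))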
diff --git a/swift/account/replicator.py b/swift/account/replicator.py
index c7f93d9b90..71be882e02 100644
--- a/swift/account/replicator.py
+++ b/swift/account/replicator.py
@@ -1,4 +1,4 @@
-# Copyright (c) 2010-2012 OpenStack, LLC.
+# Copyright (c) 2010-2012 OpenStack Foundation
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
@@ -13,12 +13,34 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 
-from swift.account import server as account_server
-from swift.common import db, db_replicator
+import optparse
+
+from swift.account.backend import AccountBroker, DATADIR
+from swift.common import db_replicator
+from swift.common.daemon import run_daemon
+from swift.common.utils import parse_options
 
 
 class AccountReplicator(db_replicator.Replicator):
     server_type = 'account'
-    brokerclass = db.AccountBroker
-    datadir = account_server.DATADIR
-    default_port = 6002
+    brokerclass = AccountBroker
+    datadir = DATADIR
+    default_port = 6202
+
+
+def main():
+    parser = optparse.OptionParser("%prog CONFIG [options]")
+    parser.add_option('-d', '--devices',
+                      help=('Replicate only given devices. '
+                            'Comma-separated list. '
+                            'Only has effect if --once is used.'))
+    parser.add_option('-p', '--partitions',
+                      help=('Replicate only given partitions. '
+                            'Comma-separated list. '
+                            'Only has effect if --once is used.'))
+    conf_file, options = parse_options(parser=parser, once=True)
+    run_daemon(AccountReplicator, conf_file, **options)
+
+
+if __name__ == '__main__':
+    main()
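
The new main() above wires --devices and --partitions into the usual parse_options()/run_daemon flow. A stdlib-only sketch of the option parsing it sets up (illustrative; the conf path and device names are made up):

    import optparse

    parser = optparse.OptionParser("%prog CONFIG [options]")
    parser.add_option('-d', '--devices',
                      help='Replicate only given devices. Comma-separated list.')
    parser.add_option('-p', '--partitions',
                      help='Replicate only given partitions. Comma-separated list.')
    options, args = parser.parse_args(
        ['/etc/swift/account-server.conf', '--devices', 'sdb1,sdb2'])
    print(options.devices)   # -> sdb1,sdb2
    print(args)              # -> ['/etc/swift/account-server.conf']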
diff --git a/swift/account/server.py b/swift/account/server.py
index 5b3df742a5..2134056d02 100644
--- a/swift/account/server.py
+++ b/swift/account/server.py
@@ -1,4 +1,4 @@
-# Copyright (c) 2010-2012 OpenStack, LLC.
+# Copyright (c) 2010-2012 OpenStack Foundation
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
@@ -13,361 +13,327 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 
-from __future__ import with_statement
-
+import json
 import os
+import sys
 import time
 import traceback
-from urllib import unquote
-from xml.sax import saxutils
 
 from eventlet import Timeout
 
 import swift.common.db
-from swift.common.db import AccountBroker
-from swift.common.utils import get_logger, get_param, hash_path, public, \
-    normalize_timestamp, split_path, storage_directory, config_true_value, \
-    validate_device_partition, json, timing_stats
-from swift.common.constraints import ACCOUNT_LISTING_LIMIT, \
-    check_mount, check_float, check_utf8, FORMAT2CONTENT_TYPE
+from swift.account.backend import AccountBroker, DATADIR
+from swift.account.utils import account_listing_response, get_response_headers
+from swift.common.db import DatabaseConnectionError, DatabaseAlreadyExists
+from swift.common.request_helpers import get_param, \
+    split_and_validate_path, validate_internal_account, \
+    validate_internal_container, constrain_req_limit
+from swift.common.utils import get_logger, hash_path, public, \
+    Timestamp, storage_directory, config_true_value, \
+    replication, get_log_line, \
+    config_fallocate_value, fs_has_free_space, parse_options
+from swift.common.constraints import valid_timestamp, check_utf8, \
+    check_drive, AUTO_CREATE_ACCOUNT_PREFIX
+from swift.common import constraints
 from swift.common.db_replicator import ReplicatorRpc
+from swift.common.base_storage_server import BaseStorageServer, timing_stats
+from swift.common.middleware import listing_formats
 from swift.common.swob import HTTPAccepted, HTTPBadRequest, \
     HTTPCreated, HTTPForbidden, HTTPInternalServerError, \
     HTTPMethodNotAllowed, HTTPNoContent, HTTPNotFound, \
-    HTTPPreconditionFailed, HTTPConflict, Request, Response, \
-    HTTPInsufficientStorage, HTTPNotAcceptable
+    HTTPPreconditionFailed, HTTPConflict, Request, \
+    HTTPInsufficientStorage, HTTPException, wsgi_to_str
+from swift.common.request_helpers import is_sys_or_user_meta
+from swift.common.wsgi import run_wsgi
+
+
+def get_account_name_and_placement(req):
+    """
+    Split and validate path for an account.
+
+    :param req: a swob request
+
+    :returns: a tuple of path parts as strings
+    """
+    drive, part, account = split_and_validate_path(req, 3)
+    validate_internal_account(account)
+    return drive, part, account
 
 
-DATADIR = 'accounts'
+def get_container_name_and_placement(req):
+    """
+    Split and validate path for a container.
 
+    :param req: a swob request
 
-class AccountController(object):
+    :returns: a tuple of path parts as strings
+    """
+    drive, part, account, container = split_and_validate_path(req, 3, 4)
+    validate_internal_container(account, container)
+    return drive, part, account, container
+
+
+class AccountController(BaseStorageServer):
     """WSGI controller for the account server."""
 
-    def __init__(self, conf):
-        self.logger = get_logger(conf, log_route='account-server')
+    server_type = 'account-server'
+
+    def __init__(self, conf, logger=None):
+        super(AccountController, self).__init__(conf)
+        self.logger = logger or get_logger(conf, log_route='account-server')
+        self.log_requests = config_true_value(conf.get('log_requests', 'true'))
         self.root = conf.get('devices', '/srv/node')
         self.mount_check = config_true_value(conf.get('mount_check', 'true'))
         self.replicator_rpc = ReplicatorRpc(self.root, DATADIR, AccountBroker,
                                             self.mount_check,
                                             logger=self.logger)
-        self.auto_create_account_prefix = \
-            conf.get('auto_create_account_prefix') or '.'
+        self.auto_create_account_prefix = AUTO_CREATE_ACCOUNT_PREFIX
+
         swift.common.db.DB_PREALLOCATION = \
             config_true_value(conf.get('db_preallocation', 'f'))
+        swift.common.db.QUERY_LOGGING = \
+            config_true_value(conf.get('db_query_logging', 'f'))
+        self.fallocate_reserve, self.fallocate_is_percent = \
+            config_fallocate_value(conf.get('fallocate_reserve', '1%'))
 
-    def _get_account_broker(self, drive, part, account):
+    def _get_account_broker(self, drive, part, account, **kwargs):
         hsh = hash_path(account)
         db_dir = storage_directory(DATADIR, part, hsh)
         db_path = os.path.join(self.root, drive, db_dir, hsh + '.db')
-        return AccountBroker(db_path, account=account, logger=self.logger)
+        kwargs.setdefault('account', account)
+        kwargs.setdefault('logger', self.logger)
+        return AccountBroker(db_path, **kwargs)
+
+    def _deleted_response(self, broker, req, resp, body=''):
+        # We are here since either the account does not exist or
+        # it exists but marked for deletion.
+        headers = {}
+        # Try to check if account exists and is marked for deletion
+        try:
+            if broker.is_status_deleted():
+                # Account does exist and is marked for deletion
+                headers = {'X-Account-Status': 'Deleted'}
+        except DatabaseConnectionError:
+            # Account does not exist!
+            pass
+        return resp(request=req, headers=headers, charset='utf-8', body=body)
+
+    def check_free_space(self, drive):
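+        # Enforce fallocate_reserve before accepting PUTs so a nearly
+        # full disk answers 507 instead of creating new account DBs.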
+        drive_root = os.path.join(self.root, drive)
+        return fs_has_free_space(
+            drive_root, self.fallocate_reserve, self.fallocate_is_percent)
 
     @public
-    @timing_stats
+    @timing_stats()
     def DELETE(self, req):
         """Handle HTTP DELETE request."""
+        drive, part, account = get_account_name_and_placement(req)
         try:
-            drive, part, account = split_path(unquote(req.path), 3)
-            validate_device_partition(drive, part)
-        except ValueError, err:
-            return HTTPBadRequest(body=str(err), content_type='text/plain',
-                                  request=req)
-        if self.mount_check and not check_mount(self.root, drive):
+            check_drive(self.root, drive, self.mount_check)
+        except ValueError:
             return HTTPInsufficientStorage(drive=drive, request=req)
-        if 'x-timestamp' not in req.headers or \
-                not check_float(req.headers['x-timestamp']):
-            return HTTPBadRequest(body='Missing timestamp', request=req,
-                                  content_type='text/plain')
+        req_timestamp = valid_timestamp(req)
         broker = self._get_account_broker(drive, part, account)
         if broker.is_deleted():
-            return HTTPNotFound(request=req)
-        broker.delete_db(req.headers['x-timestamp'])
-        return HTTPNoContent(request=req)
+            return self._deleted_response(broker, req, HTTPNotFound)
+        broker.delete_db(req_timestamp.internal)
+        return self._deleted_response(broker, req, HTTPNoContent)
+
+    def _update_metadata(self, req, broker, req_timestamp):
+        metadata = {
+            wsgi_to_str(key): (wsgi_to_str(value), req_timestamp.internal)
+            for key, value in req.headers.items()
+            if is_sys_or_user_meta('account', key)}
+        if metadata:
+            broker.update_metadata(metadata, validate_metadata=True)
 
     @public
-    @timing_stats
+    @timing_stats()
     def PUT(self, req):
         """Handle HTTP PUT request."""
+        drive, part, account, container = get_container_name_and_placement(req)
         try:
-            drive, part, account, container = split_path(unquote(req.path),
-                                                         3, 4)
-            validate_device_partition(drive, part)
-        except ValueError, err:
-            return HTTPBadRequest(body=str(err), content_type='text/plain',
-                                  request=req)
-        if self.mount_check and not check_mount(self.root, drive):
+            check_drive(self.root, drive, self.mount_check)
+        except ValueError:
+            return HTTPInsufficientStorage(drive=drive, request=req)
+        if not self.check_free_space(drive):
             return HTTPInsufficientStorage(drive=drive, request=req)
-        broker = self._get_account_broker(drive, part, account)
         if container:   # put account container
+            if 'x-timestamp' not in req.headers:
+                timestamp = Timestamp.now()
+            else:
+                timestamp = valid_timestamp(req)
+            pending_timeout = None
+            container_policy_index = \
+                req.headers.get('X-Backend-Storage-Policy-Index', 0)
             if 'x-trans-id' in req.headers:
-                broker.pending_timeout = 3
+                pending_timeout = 3
+            broker = self._get_account_broker(drive, part, account,
+                                              pending_timeout=pending_timeout)
             if account.startswith(self.auto_create_account_prefix) and \
                     not os.path.exists(broker.db_file):
-                broker.initialize(normalize_timestamp(
-                    req.headers.get('x-timestamp') or time.time()))
-            if req.headers.get('x-account-override-deleted', 'no').lower() != \
-                    'yes' and broker.is_deleted():
+                try:
+                    broker.initialize(timestamp.internal)
+                except DatabaseAlreadyExists:
+                    pass
+            if (req.headers.get('x-account-override-deleted', 'no').lower() !=
+                    'yes' and broker.is_deleted()) \
+                    or not os.path.exists(broker.db_file):
                 return HTTPNotFound(request=req)
             broker.put_container(container, req.headers['x-put-timestamp'],
                                  req.headers['x-delete-timestamp'],
                                  req.headers['x-object-count'],
-                                 req.headers['x-bytes-used'])
+                                 req.headers['x-bytes-used'],
+                                 container_policy_index)
             if req.headers['x-delete-timestamp'] > \
                     req.headers['x-put-timestamp']:
                 return HTTPNoContent(request=req)
             else:
                 return HTTPCreated(request=req)
         else:   # put account
-            timestamp = normalize_timestamp(req.headers['x-timestamp'])
+            timestamp = valid_timestamp(req)
+            broker = self._get_account_broker(drive, part, account)
             if not os.path.exists(broker.db_file):
-                broker.initialize(timestamp)
-                created = True
+                try:
+                    broker.initialize(timestamp.internal)
+                    created = True
+                except DatabaseAlreadyExists:
+                    created = False
             elif broker.is_status_deleted():
-                return HTTPForbidden(request=req, body='Recently deleted')
+                return self._deleted_response(broker, req, HTTPForbidden,
+                                              body='Recently deleted')
             else:
                 created = broker.is_deleted()
-                broker.update_put_timestamp(timestamp)
+                broker.update_put_timestamp(timestamp.internal)
                 if broker.is_deleted():
                     return HTTPConflict(request=req)
-            metadata = {}
-            metadata.update((key, (value, timestamp))
-                            for key, value in req.headers.iteritems()
-                            if key.lower().startswith('x-account-meta-'))
-            if metadata:
-                broker.update_metadata(metadata)
+            self._update_metadata(req, broker, timestamp)
             if created:
                 return HTTPCreated(request=req)
             else:
                 return HTTPAccepted(request=req)
 
     @public
-    @timing_stats
+    @timing_stats()
     def HEAD(self, req):
         """Handle HTTP HEAD request."""
-        # TODO(refactor): The account server used to provide a 'account and
-        # container existence check all-in-one' call by doing a HEAD with a
-        # container path. However, container existence is now checked with the
-        # container servers directly so this is no longer needed. We should
-        # refactor out the container existence check here and retest
-        # everything.
+        drive, part, account = get_account_name_and_placement(req)
+        out_content_type = listing_formats.get_listing_content_type(req)
         try:
-            drive, part, account, container = split_path(unquote(req.path),
-                                                         3, 4)
-            validate_device_partition(drive, part)
-        except ValueError, err:
-            return HTTPBadRequest(body=str(err), content_type='text/plain',
-                                  request=req)
-        if self.mount_check and not check_mount(self.root, drive):
+            check_drive(self.root, drive, self.mount_check)
+        except ValueError:
             return HTTPInsufficientStorage(drive=drive, request=req)
-        broker = self._get_account_broker(drive, part, account)
-        if not container:
-            broker.pending_timeout = 0.1
-            broker.stale_reads_ok = True
+        broker = self._get_account_broker(drive, part, account,
+                                          pending_timeout=0.1,
+                                          stale_reads_ok=True)
         if broker.is_deleted():
-            return HTTPNotFound(request=req)
-        info = broker.get_info()
-        headers = {
-            'X-Account-Container-Count': info['container_count'],
-            'X-Account-Object-Count': info['object_count'],
-            'X-Account-Bytes-Used': info['bytes_used'],
-            'X-Timestamp': info['created_at'],
-            'X-PUT-Timestamp': info['put_timestamp']}
-        if container:
-            container_ts = broker.get_container_timestamp(container)
-            if container_ts is not None:
-                headers['X-Container-Timestamp'] = container_ts
-        headers.update((key, value)
-                       for key, (value, timestamp) in
-                       broker.metadata.iteritems() if value != '')
-        if get_param(req, 'format'):
-            req.accept = FORMAT2CONTENT_TYPE.get(
-                get_param(req, 'format').lower(), FORMAT2CONTENT_TYPE['plain'])
-        headers['Content-Type'] = req.accept.best_match(
-            ['text/plain', 'application/json', 'application/xml', 'text/xml'])
-        if not headers['Content-Type']:
-            return HTTPNotAcceptable(request=req)
+            return self._deleted_response(broker, req, HTTPNotFound)
+        headers = get_response_headers(broker)
+        headers['Content-Type'] = out_content_type
+        headers['Content-Length'] = 0
         return HTTPNoContent(request=req, headers=headers, charset='utf-8')
 
     @public
-    @timing_stats
+    @timing_stats()
     def GET(self, req):
         """Handle HTTP GET request."""
+        drive, part, account = get_account_name_and_placement(req)
+        prefix = get_param(req, 'prefix')
+        delimiter = get_param(req, 'delimiter')
+        reverse = config_true_value(get_param(req, 'reverse'))
+        limit = constrain_req_limit(req, constraints.ACCOUNT_LISTING_LIMIT)
+        marker = get_param(req, 'marker', '')
+        end_marker = get_param(req, 'end_marker')
+        out_content_type = listing_formats.get_listing_content_type(req)
+
         try:
-            drive, part, account = split_path(unquote(req.path), 3)
-            validate_device_partition(drive, part)
-        except ValueError, err:
-            return HTTPBadRequest(body=str(err), content_type='text/plain',
-                                  request=req)
-        if self.mount_check and not check_mount(self.root, drive):
+            check_drive(self.root, drive, self.mount_check)
+        except ValueError:
             return HTTPInsufficientStorage(drive=drive, request=req)
-        broker = self._get_account_broker(drive, part, account)
-        broker.pending_timeout = 0.1
-        broker.stale_reads_ok = True
+        broker = self._get_account_broker(drive, part, account,
+                                          pending_timeout=0.1,
+                                          stale_reads_ok=True)
         if broker.is_deleted():
-            return HTTPNotFound(request=req)
-        info = broker.get_info()
-        resp_headers = {
-            'X-Account-Container-Count': info['container_count'],
-            'X-Account-Object-Count': info['object_count'],
-            'X-Account-Bytes-Used': info['bytes_used'],
-            'X-Timestamp': info['created_at'],
-            'X-PUT-Timestamp': info['put_timestamp']}
-        resp_headers.update((key, value)
-                            for key, (value, timestamp) in
-                            broker.metadata.iteritems() if value != '')
-        try:
-            prefix = get_param(req, 'prefix')
-            delimiter = get_param(req, 'delimiter')
-            if delimiter and (len(delimiter) > 1 or ord(delimiter) > 254):
-                # delimiters can be made more flexible later
-                return HTTPPreconditionFailed(body='Bad delimiter')
-            limit = ACCOUNT_LISTING_LIMIT
-            given_limit = get_param(req, 'limit')
-            if given_limit and given_limit.isdigit():
-                limit = int(given_limit)
-                if limit > ACCOUNT_LISTING_LIMIT:
-                    return HTTPPreconditionFailed(request=req,
-                                                  body='Maximum limit is %d' %
-                                                  ACCOUNT_LISTING_LIMIT)
-            marker = get_param(req, 'marker', '')
-            end_marker = get_param(req, 'end_marker')
-            query_format = get_param(req, 'format')
-        except UnicodeDecodeError, err:
-            return HTTPBadRequest(body='parameters not utf8',
-                                  content_type='text/plain', request=req)
-        if query_format:
-            req.accept = FORMAT2CONTENT_TYPE.get(query_format.lower(),
-                                                 FORMAT2CONTENT_TYPE['plain'])
-        out_content_type = req.accept.best_match(
-            ['text/plain', 'application/json', 'application/xml', 'text/xml'])
-        if not out_content_type:
-            return HTTPNotAcceptable(request=req)
-        account_list = broker.list_containers_iter(limit, marker, end_marker,
-                                                   prefix, delimiter)
-        if out_content_type == 'application/json':
-            data = []
-            for (name, object_count, bytes_used, is_subdir) in account_list:
-                if is_subdir:
-                    data.append({'subdir': name})
-                else:
-                    data.append({'name': name, 'count': object_count,
-                                'bytes': bytes_used})
-            account_list = json.dumps(data)
-        elif out_content_type.endswith('/xml'):
-            output_list = ['<?xml version="1.0" encoding="UTF-8"?>',
-                           '<account name="%s">' % account]
-            for (name, object_count, bytes_used, is_subdir) in account_list:
-                name = saxutils.escape(name)
-                if is_subdir:
-                    output_list.append('<subdir name="%s" />' % name)
-                else:
-                    item = '<container><name>%s</name><count>%s</count>' \
-                           '<bytes>%s</bytes></container>' % \
-                           (name, object_count, bytes_used)
-                    output_list.append(item)
-            output_list.append('</account>')
-            account_list = '\n'.join(output_list)
-        else:
-            if not account_list:
-                return HTTPNoContent(request=req, headers=resp_headers)
-            account_list = '\n'.join(r[0] for r in account_list) + '\n'
-        ret = Response(body=account_list, request=req, headers=resp_headers)
-        ret.content_type = out_content_type
-        ret.charset = 'utf-8'
-        return ret
+            return self._deleted_response(broker, req, HTTPNotFound)
+        return account_listing_response(account, req, out_content_type, broker,
+                                        limit, marker, end_marker, prefix,
+                                        delimiter, reverse)
 
     @public
-    @timing_stats
+    @replication
+    @timing_stats()
     def REPLICATE(self, req):
         """
         Handle HTTP REPLICATE request.
         Handler for RPC calls for account replication.
         """
+        post_args = split_and_validate_path(req, 3)
+        drive, partition, hash = post_args
         try:
-            post_args = split_path(unquote(req.path), 3)
-            drive, partition, hash = post_args
-            validate_device_partition(drive, partition)
-        except ValueError, err:
-            return HTTPBadRequest(body=str(err), content_type='text/plain',
-                                  request=req)
-        if self.mount_check and not check_mount(self.root, drive):
+            check_drive(self.root, drive, self.mount_check)
+        except ValueError:
+            return HTTPInsufficientStorage(drive=drive, request=req)
+        if not self.check_free_space(drive):
             return HTTPInsufficientStorage(drive=drive, request=req)
         try:
             args = json.load(req.environ['wsgi.input'])
-        except ValueError, err:
+        except ValueError as err:
             return HTTPBadRequest(body=str(err), content_type='text/plain')
         ret = self.replicator_rpc.dispatch(post_args, args)
         ret.request = req
         return ret
 
     @public
-    @timing_stats
+    @timing_stats()
     def POST(self, req):
         """Handle HTTP POST request."""
+        drive, part, account = get_account_name_and_placement(req)
+        req_timestamp = valid_timestamp(req)
         try:
-            drive, part, account = split_path(unquote(req.path), 3)
-            validate_device_partition(drive, part)
-        except ValueError, err:
-            return HTTPBadRequest(body=str(err), content_type='text/plain',
-                                  request=req)
-        if 'x-timestamp' not in req.headers or \
-                not check_float(req.headers['x-timestamp']):
-            return HTTPBadRequest(body='Missing or bad timestamp',
-                                  request=req,
-                                  content_type='text/plain')
-        if self.mount_check and not check_mount(self.root, drive):
+            check_drive(self.root, drive, self.mount_check)
+        except ValueError:
+            return HTTPInsufficientStorage(drive=drive, request=req)
+        if not self.check_free_space(drive):
             return HTTPInsufficientStorage(drive=drive, request=req)
         broker = self._get_account_broker(drive, part, account)
         if broker.is_deleted():
-            return HTTPNotFound(request=req)
-        timestamp = normalize_timestamp(req.headers['x-timestamp'])
-        metadata = {}
-        metadata.update((key, (value, timestamp))
-                        for key, value in req.headers.iteritems()
-                        if key.lower().startswith('x-account-meta-'))
-        if metadata:
-            broker.update_metadata(metadata)
+            return self._deleted_response(broker, req, HTTPNotFound)
+        self._update_metadata(req, broker, req_timestamp)
         return HTTPNoContent(request=req)
 
     def __call__(self, env, start_response):
         start_time = time.time()
         req = Request(env)
         self.logger.txn_id = req.headers.get('x-trans-id', None)
-        if not check_utf8(req.path_info):
+        if not check_utf8(wsgi_to_str(req.path_info), internal=True):
             res = HTTPPreconditionFailed(body='Invalid UTF8')
         else:
             try:
                 # disallow methods which are not publicly accessible
-                try:
-                    method = getattr(self, req.method)
-                    getattr(method, 'publicly_accessible')
-                except AttributeError:
+                if req.method not in self.allowed_methods:
                     res = HTTPMethodNotAllowed()
                 else:
-                    res = method(req)
+                    res = getattr(self, req.method)(req)
+            except HTTPException as error_response:
+                res = error_response
             except (Exception, Timeout):
-                self.logger.exception(_('ERROR __call__ error with %(method)s'
-                                        ' %(path)s '),
+                self.logger.exception('ERROR __call__ error with %(method)s'
+                                      ' %(path)s ',
                                       {'method': req.method, 'path': req.path})
                 res = HTTPInternalServerError(body=traceback.format_exc())
-        trans_time = '%.4f' % (time.time() - start_time)
-        additional_info = ''
-        if res.headers.get('x-container-timestamp') is not None:
-            additional_info += 'x-container-timestamp: %s' % \
-                res.headers['x-container-timestamp']
-        log_message = '%s - - [%s] "%s %s" %s %s "%s" "%s" "%s" %s "%s"' % (
-            req.remote_addr,
-            time.strftime('%d/%b/%Y:%H:%M:%S +0000', time.gmtime()),
-            req.method, req.path,
-            res.status.split()[0], res.content_length or '-',
-            req.headers.get('x-trans-id', '-'),
-            req.referer or '-', req.user_agent or '-',
-            trans_time,
-            additional_info)
-        if req.method.upper() == 'REPLICATE':
-            self.logger.debug(log_message)
-        else:
-            self.logger.info(log_message)
+        if self.log_requests:
+            trans_time = time.time() - start_time
+            additional_info = ''
+            if res.headers.get('x-container-timestamp') is not None:
+                additional_info += 'x-container-timestamp: %s' % \
+                    res.headers['x-container-timestamp']
+            log_msg = get_log_line(req, res, trans_time, additional_info,
+                                   self.log_format, self.anonymization_method,
+                                   self.anonymization_salt)
+            if req.method.upper() == 'REPLICATE':
+                self.logger.debug(log_msg)
+            else:
+                self.logger.info(log_msg)
         return res(env, start_response)
 
 
@@ -376,3 +342,12 @@ def app_factory(global_conf, **local_conf):
     conf = global_conf.copy()
     conf.update(local_conf)
     return AccountController(conf)
+
+
+def main():
+    conf_file, options = parse_options(test_config=True)
+    sys.exit(run_wsgi(conf_file, 'account-server', **options))
+
+
+if __name__ == '__main__':
+    main()
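
The refactored handlers above replace ad-hoc normalize_timestamp(req.headers['x-timestamp']) calls with valid_timestamp(req), which returns a Timestamp object; the broker is fed its internal form while user-facing headers use the normal form. A minimal sketch of the distinction, assuming only that swift.common.utils.Timestamp is importable:

    from swift.common.utils import Timestamp

    ts = Timestamp('1525354800.12345')
    # .normal is the classic ten.five-digit form shown in X-Timestamp headers;
    # .internal may carry an extra "_<offset>" suffix and is what the broker
    # stores via broker.initialize() and broker.update_put_timestamp().
    print(ts.normal, ts.internal)
    assert Timestamp(ts.internal) == Timestamp(ts.normal)
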
diff --git a/swift/account/utils.py b/swift/account/utils.py
new file mode 100644
index 0000000000..2a540faaeb
--- /dev/null
+++ b/swift/account/utils.py
@@ -0,0 +1,123 @@
+# Copyright (c) 2010-2013 OpenStack Foundation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+# implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import json
+
+from swift.common import constraints
+from swift.common.middleware import listing_formats
+from swift.common.swob import HTTPOk, HTTPNoContent, str_to_wsgi
+from swift.common.utils import Timestamp
+from swift.common.storage_policy import POLICIES
+
+
+class FakeAccountBroker(object):
+    """
+    Quacks like an account broker, but doesn't actually do anything. Responds
+    like an account broker would for a real, empty account with no metadata.
+    """
+    def get_info(self):
+        now = Timestamp.now().internal
+        return {'container_count': 0,
+                'object_count': 0,
+                'bytes_used': 0,
+                'created_at': now,
+                'put_timestamp': now}
+
+    def list_containers_iter(self, *_, **__):
+        return []
+
+    @property
+    def metadata(self):
+        return {}
+
+    def get_policy_stats(self):
+        return {}
+
+
+def get_response_headers(broker):
+    info = broker.get_info()
+    resp_headers = {
+        'X-Account-Container-Count': info['container_count'],
+        'X-Account-Object-Count': info['object_count'],
+        'X-Account-Bytes-Used': info['bytes_used'],
+        'X-Timestamp': Timestamp(info['created_at']).normal,
+        'X-PUT-Timestamp': Timestamp(info['put_timestamp']).normal}
+    policy_stats = broker.get_policy_stats()
+    for policy_idx, stats in policy_stats.items():
+        policy = POLICIES.get_by_index(policy_idx)
+        if not policy:
+            continue
+        header_prefix = 'X-Account-Storage-Policy-%s-%%s' % policy.name
+        for key, value in stats.items():
+            header_name = header_prefix % key.replace('_', '-')
+            resp_headers[header_name] = value
+    resp_headers.update((str_to_wsgi(key), str_to_wsgi(value))
+                        for key, (value, _timestamp) in
+                        broker.metadata.items() if value != '')
+    return resp_headers
+
+
+def account_listing_response(account, req, response_content_type, broker=None,
+                             limit=constraints.ACCOUNT_LISTING_LIMIT,
+                             marker='', end_marker='', prefix='', delimiter='',
+                             reverse=False):
+    if broker is None:
+        broker = FakeAccountBroker()
+
+    resp_headers = get_response_headers(broker)
+
+    account_list = broker.list_containers_iter(limit, marker, end_marker,
+                                               prefix, delimiter, reverse,
+                                               req.allow_reserved_names)
+    data = []
+    for (name, object_count, bytes_used, put_timestamp,
+         storage_policy_index, is_subdir) \
+            in account_list:
+        if is_subdir:
+            data.append({'subdir': name})
+        else:
+            container = {
+                'name': name,
+                'count': object_count,
+                'bytes': bytes_used,
+                'last_modified': Timestamp(put_timestamp).isoformat}
+            # Add the container's storage policy to the response, unless
+            # storage_policy_index was not found in POLICIES, which means
+            # the storage policy is missing from the Swift configuration
+            # or otherwise could not be determined.
+            #
+            # The storage policy should always be returned when
+            # everything is configured correctly, but clients are
+            # expected to be able to handle this case regardless,
+            # if only to support older versions of swift.
+            if storage_policy_index in POLICIES:
+                container['storage_policy'] = (
+                    POLICIES[storage_policy_index].name
+                )
+            data.append(container)
+    if response_content_type.endswith('/xml'):
+        account_list = listing_formats.account_to_xml(data, account)
+        ret = HTTPOk(body=account_list, request=req, headers=resp_headers)
+    elif response_content_type.endswith('/json'):
+        account_list = json.dumps(data).encode('ascii')
+        ret = HTTPOk(body=account_list, request=req, headers=resp_headers)
+    elif data:
+        account_list = listing_formats.listing_to_text(data)
+        ret = HTTPOk(body=account_list, request=req, headers=resp_headers)
+    else:
+        ret = HTTPNoContent(request=req, headers=resp_headers)
+    ret.content_type = response_content_type
+    ret.charset = 'utf-8'
+    return ret
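
As a quick illustration of get_response_headers() above, feeding it the FakeAccountBroker from the same module yields the baseline account headers. This is a sketch, not part of the patch, and assumes a tree where swift.account.utils is importable:

    from swift.account.utils import FakeAccountBroker, get_response_headers

    headers = get_response_headers(FakeAccountBroker())
    for name in sorted(headers):
        print(name, headers[name])
    # Expect X-Account-Bytes-Used, X-Account-Container-Count,
    # X-Account-Object-Count, X-Timestamp and X-PUT-Timestamp; the
    # X-Account-Storage-Policy-<name>-* headers only appear for real brokers
    # whose get_policy_stats() reports per-policy usage.
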
diff --git a/test/functionalnosetests/__init__.py b/swift/cli/__init__.py
similarity index 100%
rename from test/functionalnosetests/__init__.py
rename to swift/cli/__init__.py
diff --git a/bin/swift-account-audit b/swift/cli/account_audit.py
similarity index 71%
rename from bin/swift-account-audit
rename to swift/cli/account_audit.py
index 000048fa1a..6e67fff8e6 100755
--- a/bin/swift-account-audit
+++ b/swift/cli/account_audit.py
@@ -1,5 +1,5 @@
 #!/usr/bin/env python
-# Copyright (c) 2010-2012 OpenStack, LLC.
+# Copyright (c) 2010-2012 OpenStack Foundation
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
@@ -16,17 +16,17 @@
 
 import os
 import sys
-from urllib import quote
-from hashlib import md5
 import getopt
 from itertools import chain
 
-import simplejson
+import json
 from eventlet.greenpool import GreenPool
 from eventlet.event import Event
+from urllib.parse import quote
 
 from swift.common.ring import Ring
 from swift.common.utils import split_path
+from swift.common.utils.base import md5
 from swift.common.bufferedhttp import http_connect
 
 
@@ -43,9 +43,9 @@
 
 Examples!
 
-    %(cmd)s SOSO_88ad0b83-b2c5-4fa1-b2d6-60c597202076
-    %(cmd)s SOSO_88ad0b83-b2c5-4fa1-b2d6-60c597202076/container/object
-    %(cmd)s -e errors.txt SOSO_88ad0b83-b2c5-4fa1-b2d6-60c597202076/container
+    %(cmd)s AUTH_88ad0b83-b2c5-4fa1-b2d6-60c597202076
+    %(cmd)s AUTH_88ad0b83-b2c5-4fa1-b2d6-60c597202076/container/object
+    %(cmd)s -e errors.txt AUTH_88ad0b83-b2c5-4fa1-b2d6-60c597202076/container
     %(cmd)s < errors.txt
     %(cmd)s -c 25 -d < errors.txt
 """ % {'cmd': sys.argv[0]}
@@ -55,10 +55,9 @@ class Auditor(object):
     def __init__(self, swift_dir='/etc/swift', concurrency=50, deep=False,
                  error_file=None):
         self.pool = GreenPool(concurrency)
-        self.object_ring = Ring(os.path.join(swift_dir, ring_name='object'))
-        self.container_ring = \
-            Ring(os.path.join(swift_dir, ring_name='container'))
-        self.account_ring = Ring(os.path.join(swift_dir, ring_name='account'))
+        self.object_ring = Ring(swift_dir, ring_name='object')
+        self.container_ring = Ring(swift_dir, ring_name='container')
+        self.account_ring = Ring(swift_dir, ring_name='account')
         self.deep = deep
         self.error_file = error_file
         # zero out stats
@@ -79,7 +78,7 @@ def audit_object(self, account, container, name):
         container_listing = self.audit_container(account, container)
         consistent = True
         if name not in container_listing:
-            print "  Object %s missing in container listing!" % path
+            print("  Object %s missing in container listing!" % path)
             consistent = False
             hash = None
         else:
@@ -91,7 +90,7 @@ def audit_object(self, account, container, name):
                     conn = http_connect(node['ip'], node['port'],
                                         node['device'], part, 'GET', path, {})
                     resp = conn.getresponse()
-                    calc_hash = md5()
+                    calc_hash = md5(usedforsecurity=False)
                     chunk = True
                     while chunk:
                         chunk = resp.read(8192)
@@ -100,15 +99,15 @@ def audit_object(self, account, container, name):
                     if resp.status // 100 != 2:
                         self.object_not_found += 1
                         consistent = False
-                        print '  Bad status GETting object "%s" on %s/%s' \
-                            % (path, node['ip'], node['device'])
+                        print('  Bad status %s GETting object "%s" on %s/%s'
+                              % (resp.status, path,
+                                 node['ip'], node['device']))
                         continue
                     if resp.getheader('ETag').strip('"') != calc_hash:
                         self.object_checksum_mismatch += 1
                         consistent = False
-                        print '  MD5 doesnt match etag for "%s" on %s/%s' \
-                            % (path, node['ip'], node['device'])
-                    etags.append(resp.getheader('ETag'))
+                        print('  MD5 does not match etag for "%s" on %s/%s'
+                              % (path, node['ip'], node['device']))
                 else:
                     conn = http_connect(node['ip'], node['port'],
                                         node['device'], part, 'HEAD',
@@ -117,28 +116,36 @@ def audit_object(self, account, container, name):
                     if resp.status // 100 != 2:
                         self.object_not_found += 1
                         consistent = False
-                        print '  Bad status HEADing object "%s" on %s/%s' \
-                            % (path, node['ip'], node['device'])
+                        print('  Bad status %s HEADing object "%s" on %s/%s'
+                              % (resp.status, path,
+                                 node['ip'], node['device']))
                         continue
-                    etags.append(resp.getheader('ETag'))
+
+                override_etag = resp.getheader(
+                    'X-Object-Sysmeta-Container-Update-Override-Etag')
+                if override_etag:
+                    etags.append((override_etag, node))
+                else:
+                    etags.append((resp.getheader('ETag'), node))
             except Exception:
                 self.object_exceptions += 1
                 consistent = False
-                print '  Exception fetching object "%s" on %s/%s' \
-                    % (path, node['ip'], node['device'])
+                print('  Exception fetching object "%s" on %s/%s'
+                      % (path, node['ip'], node['device']))
                 continue
         if not etags:
             consistent = False
-            print "  Failed fo fetch object %s at all!" % path
+            print("  Failed fo fetch object %s at all!" % path)
         elif hash:
-            for etag in etags:
-                if resp.getheader('ETag').strip('"') != hash:
+            for etag, node in etags:
+                if etag.strip('"') != hash:
                     consistent = False
                     self.object_checksum_mismatch += 1
-                    print '  ETag mismatch for "%s" on %s/%s' \
-                        % (path, node['ip'], node['device'])
+                    print('  ETag mismatch for "%s" on %s/%s'
+                          % (path, node['ip'], node['device']))
         if not consistent and self.error_file:
-            print >>open(self.error_file, 'a'), path
+            with open(self.error_file, 'a') as err_file:
+                print(path, file=err_file)
         self.objects_checked += 1
 
     def audit_container(self, account, name, recurse=False):
@@ -147,13 +154,13 @@ def audit_container(self, account, name, recurse=False):
         if (account, name) in self.list_cache:
             return self.list_cache[(account, name)]
         self.in_progress[(account, name)] = Event()
-        print 'Auditing container "%s"' % name
+        print('Auditing container "%s"' % name)
         path = '/%s/%s' % (account, name)
         account_listing = self.audit_account(account)
         consistent = True
         if name not in account_listing:
             consistent = False
-            print "  Container %s not in account listing!" % path
+            print("  Container %s not in account listing!" % path)
         part, nodes = \
             self.container_ring.get_nodes(account, name.encode('utf-8'))
         rec_d = {}
@@ -162,7 +169,6 @@ def audit_container(self, account, name, recurse=False):
             marker = ''
             results = True
             while results:
-                node_id = node['id']
                 try:
                     conn = http_connect(node['ip'], node['port'],
                                         node['device'], part, 'GET',
@@ -177,13 +183,14 @@ def audit_container(self, account, name, recurse=False):
                               (path, node['ip'], node['device']))
                         break
                     if node['id'] not in responses:
-                        responses[node['id']] = dict(resp.getheaders())
-                    results = simplejson.loads(resp.read())
+                        responses[node['id']] = {
+                            h.lower(): v for h, v in resp.getheaders()}
+                    results = json.loads(resp.read())
                 except Exception:
                     self.container_exceptions += 1
                     consistent = False
-                    print '  Exception GETting container "%s" on %s/%s' % \
-                        (path, node['ip'], node['device'])
+                    print('  Exception GETting container "%s" on %s/%s' %
+                          (path, node['ip'], node['device']))
                     break
                 if results:
                     marker = results[-1]['name']
@@ -204,13 +211,15 @@ def audit_container(self, account, name, recurse=False):
                       for header in responses.values()]
         if not obj_counts:
             consistent = False
-            print "  Failed to fetch container %s at all!" % path
+            print("  Failed to fetch container %s at all!" % path)
         else:
             if len(set(obj_counts)) != 1:
                 self.container_count_mismatch += 1
                 consistent = False
-                print "  Container databases don't agree on number of objects."
-                print "  Max: %s, Min: %s" % (max(obj_counts), min(obj_counts))
+                print(
+                    "  Container databases don't agree on number of objects.")
+                print(
+                    "  Max: %s, Min: %s" % (max(obj_counts), min(obj_counts)))
         self.containers_checked += 1
         self.list_cache[(account, name)] = rec_d
         self.in_progress[(account, name)].send(True)
@@ -219,7 +228,8 @@ def audit_container(self, account, name, recurse=False):
             for obj in rec_d.keys():
                 self.pool.spawn_n(self.audit_object, account, name, obj)
         if not consistent and self.error_file:
-            print >>open(self.error_file, 'a'), path
+            with open(self.error_file, 'a') as error_file:
+                print(path, file=error_file)
         return rec_d
 
     def audit_account(self, account, recurse=False):
@@ -228,7 +238,7 @@ def audit_account(self, account, recurse=False):
         if account in self.list_cache:
             return self.list_cache[account]
         self.in_progress[account] = Event()
-        print 'Auditing account "%s"' % account
+        print('Auditing account "%s"' % account)
         consistent = True
         path = '/%s' % account
         part, nodes = self.account_ring.get_nodes(account)
@@ -248,22 +258,23 @@ def audit_account(self, account, recurse=False):
                         self.account_not_found += 1
                         consistent = False
                         print("  Bad status GETting account '%s' "
-                              " from %ss:%ss" %
+                              " from %s:%s" %
                               (account, node['ip'], node['device']))
                         break
-                    results = simplejson.loads(resp.read())
+                    results = json.loads(resp.read())
                 except Exception:
                     self.account_exceptions += 1
                     consistent = False
-                    print("  Exception GETting account '%s' on %ss:%ss" %
+                    print("  Exception GETting account '%s' on %s:%s" %
                           (account, node['ip'], node['device']))
                     break
                 if node_id not in responses:
-                    responses[node_id] = [dict(resp.getheaders()), []]
+                    responses[node_id] = [
+                        {h.lower(): v for h, v in resp.getheaders()}, []]
                 responses[node_id][1].extend(results)
                 if results:
                     marker = results[-1]['name']
-        headers = [resp[0] for resp in responses.values()]
+        headers = [r[0] for r in responses.values()]
         cont_counts = [int(header['x-account-container-count'])
                        for header in headers]
         if len(set(cont_counts)) != 1:
@@ -272,8 +283,8 @@ def audit_account(self, account, recurse=False):
             print("  Account databases for '%s' don't agree on"
                   " number of containers." % account)
             if cont_counts:
-                print "  Max: %s, Min: %s" % (max(cont_counts),
-                                              min(cont_counts))
+                print("  Max: %s, Min: %s" % (max(cont_counts),
+                                              min(cont_counts)))
         obj_counts = [int(header['x-account-object-count'])
                       for header in headers]
         if len(set(obj_counts)) != 1:
@@ -282,8 +293,8 @@ def audit_account(self, account, recurse=False):
             print("  Account databases for '%s' don't agree on"
                   " number of objects." % account)
             if obj_counts:
-                print "  Max: %s, Min: %s" % (max(obj_counts),
-                                              min(obj_counts))
+                print("  Max: %s, Min: %s" % (max(obj_counts),
+                                              min(obj_counts)))
         containers = set()
         for resp in responses.values():
             containers.update(container['name'] for container in resp[1])
@@ -296,7 +307,8 @@ def audit_account(self, account, recurse=False):
                 self.pool.spawn_n(self.audit_container, account,
                                   container, True)
         if not consistent and self.error_file:
-            print >>open(self.error_file, 'a'), path
+            with open(self.error_file, 'a') as error_file:
+                print(path, file=error_file)
         return containers
 
     def audit(self, account, container=None, obj=None):
@@ -311,45 +323,50 @@ def wait(self):
         self.pool.waitall()
 
     def print_stats(self):
-        print
-        print "  Accounts checked: %d" % self.accounts_checked
+
+        def _print_stat(name, stat):
+            # Right align stat name in a field of 18 characters
+            print("{0:>18}: {1}".format(name, stat))
+
+        print()
+        _print_stat("Accounts checked", self.accounts_checked)
         if self.account_not_found:
-            print "  Missing Replicas: %d" % self.account_not_found
+            _print_stat("Missing Replicas", self.account_not_found)
         if self.account_exceptions:
-            print "        Exceptions: %d" % self.account_exceptions
+            _print_stat("Exceptions", self.account_exceptions)
         if self.account_container_mismatch:
-            print " Cntainer mismatch: %d" % self.account_container_mismatch
+            _print_stat("Container mismatch", self.account_container_mismatch)
         if self.account_object_mismatch:
-            print "   Object mismatch: %d" % self.account_object_mismatch
-        print
-        print "Containers checked: %d" % self.containers_checked
+            _print_stat("Object mismatch", self.account_object_mismatch)
+        print()
+        _print_stat("Containers checked", self.containers_checked)
         if self.container_not_found:
-            print "  Missing Replicas: %d" % self.container_not_found
+            _print_stat("Missing Replicas", self.container_not_found)
         if self.container_exceptions:
-            print "        Exceptions: %d" % self.container_exceptions
+            _print_stat("Exceptions", self.container_exceptions)
         if self.container_count_mismatch:
-            print "    Count mismatch: %d" % self.container_count_mismatch
+            _print_stat("Count mismatch", self.container_count_mismatch)
         if self.container_obj_mismatch:
-            print "      Obj mismatch: %d" % self.container_obj_mismatch
-        print
-        print "   Objects checked: %d" % self.objects_checked
+            _print_stat("Object mismatch", self.container_obj_mismatch)
+        print()
+        _print_stat("Objects checked", self.objects_checked)
         if self.object_not_found:
-            print "  Missing Replicas: %d" % self.object_not_found
+            _print_stat("Missing Replicas", self.object_not_found)
         if self.object_exceptions:
-            print "        Exceptions: %d" % self.object_exceptions
+            _print_stat("Exceptions", self.object_exceptions)
         if self.object_checksum_mismatch:
-            print "      MD5 Mismatch: %d" % self.object_checksum_mismatch
+            _print_stat("MD5 Mismatch", self.object_checksum_mismatch)
 
 
-if __name__ == '__main__':
+def main():
     try:
         optlist, args = getopt.getopt(sys.argv[1:], 'c:r:e:d')
-    except getopt.GetoptError, err:
-        print str(err)
-        print usage
+    except getopt.GetoptError as err:
+        print(str(err))
+        print(usage)
         sys.exit(2)
     if not args and os.isatty(sys.stdin.fileno()):
-        print usage
+        print(usage)
         sys.exit()
     opts = dict(optlist)
     options = {
@@ -366,3 +383,7 @@ def print_stats(self):
         auditor.audit(*split_path(path, 1, 3, True))
     auditor.wait()
     auditor.print_stats()
+
+
+if __name__ == '__main__':
+    main()
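
The deep-audit path above hashes each object body with the FIPS-friendly md5(usedforsecurity=False) wrapper and compares it against the quoted ETag header. A hedged sketch of that comparison; etag_matches is a hypothetical helper introduced here only for illustration:

    from swift.common.utils.base import md5

    def etag_matches(body_chunks, etag_header):
        # Hash the body the same way the auditor does and compare against the
        # ETag header with its surrounding quotes stripped.
        calc = md5(usedforsecurity=False)
        for chunk in body_chunks:
            calc.update(chunk)
        return calc.hexdigest() == etag_header.strip('"')

    # md5 of an empty body
    print(etag_matches([b''], '"d41d8cd98f00b204e9800998ecf8427e"'))  # True
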
diff --git a/swift/cli/config.py b/swift/cli/config.py
new file mode 100755
index 0000000000..447f77520a
--- /dev/null
+++ b/swift/cli/config.py
@@ -0,0 +1,90 @@
+#!/usr/bin/env python
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+# implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import optparse
+import os
+import sys
+
+from swift.common.manager import Server
+from swift.common.utils import readconf
+from swift.common.wsgi import appconfig
+
+parser = optparse.OptionParser('%prog [options] SERVER')
+parser.add_option('-c', '--config-num', metavar="N", type="int",
+                  dest="number", default=0,
+                  help="parse config for the Nth server only")
+parser.add_option('-s', '--section', help="only display matching sections")
+parser.add_option('-w', '--wsgi', action='store_true',
+                  help="use wsgi/paste parser instead of readconf")
+
+
+def _context_name(context):
+    return ':'.join((context.object_type.name, context.name))
+
+
+def inspect_app_config(app_config):
+    conf = {}
+    context = app_config.context
+    section_name = _context_name(context)
+    conf[section_name] = context.config()
+    if context.object_type.name == 'pipeline':
+        filters = context.filter_contexts
+        pipeline = []
+        for filter_context in filters:
+            conf[_context_name(filter_context)] = filter_context.config()
+            pipeline.append(filter_context.entry_point_name)
+        app_context = context.app_context
+        conf[_context_name(app_context)] = app_context.config()
+        pipeline.append(app_context.entry_point_name)
+        conf[section_name]['pipeline'] = ' '.join(pipeline)
+    return conf
+
+
+def main():
+    options, args = parser.parse_args()
+    options = dict(vars(options))
+
+    if not args:
+        return 'ERROR: specify type of server or conf_path'
+    conf_files = []
+    for arg in args:
+        if os.path.exists(arg):
+            conf_files.append(arg)
+        else:
+            conf_files += Server(arg).conf_files(**options)
+    for conf_file in conf_files:
+        print('# %s' % conf_file)
+        if options['wsgi']:
+            app_config = appconfig(conf_file)
+            conf = inspect_app_config(app_config)
+        else:
+            conf = readconf(conf_file)
+        flat_vars = {}
+        for k, v in conf.items():
+            if options['section'] and k != options['section']:
+                continue
+            if not isinstance(v, dict):
+                flat_vars[k] = v
+                continue
+            print('[%s]' % k)
+            for opt, value in v.items():
+                print('%s = %s' % (opt, value))
+            print()
+        for k, v in flat_vars.items():
+            print('# %s = %s' % (k, v))
+        print()
+
+
+if __name__ == "__main__":
+    sys.exit(main())
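
For the default (non --wsgi) path, the tool above simply walks readconf() output: dict values are printed as sections and anything else is reported as a flat option. A self-contained sketch of that shape, assuming only swift.common.utils.readconf; the sample config content is invented for illustration:

    import tempfile
    import textwrap
    from swift.common.utils import readconf

    SAMPLE = textwrap.dedent("""\
        [DEFAULT]
        bind_port = 6202

        [app:account-server]
        use = egg:swift#account
        """)

    with tempfile.NamedTemporaryFile('w', suffix='.conf') as f:
        f.write(SAMPLE)
        f.flush()
        for section, options in readconf(f.name).items():
            if not isinstance(options, dict):
                continue  # e.g. the __file__ entry readconf adds
            print('[%s]' % section)
            for opt, value in options.items():
                print('%s = %s' % (opt, value))
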
diff --git a/swift/cli/container_deleter.py b/swift/cli/container_deleter.py
new file mode 100644
index 0000000000..7b3ae95892
--- /dev/null
+++ b/swift/cli/container_deleter.py
@@ -0,0 +1,168 @@
+# Licensed under the Apache License, Version 2.0 (the "License"); you may not
+# use this file except in compliance with the License. You may obtain a copy
+# of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
+# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
+# License for the specific language governing permissions and limitations
+# under the License.
+
+'''
+Enqueue background jobs to delete portions of a container's namespace.
+
+Accepts prefix, marker, and end-marker args that work as in container
+listings. Objects found in the listing will be marked to be deleted
+by the object-expirer; until the object is actually deleted, it will
+continue to appear in listings.
+
+If there are many objects, this operation may take some time. Stats will
+periodically be emitted so you know the process hasn't hung. These will
+also include the last object marked for deletion; if there is a failure,
+pass this as the ``--marker`` when retrying to minimize duplicative work.
+'''
+
+import argparse
+import io
+import itertools
+import json
+import time
+
+from swift.common.internal_client import InternalClient
+from swift.common.utils import Timestamp, MD5_OF_EMPTY_STRING
+from swift.obj.expirer import build_task_obj, ASYNC_DELETE_TYPE
+
+OBJECTS_PER_UPDATE = 10000
+
+
+def make_delete_jobs(account, container, objects, timestamp):
+    '''
+    Create a list of async-delete jobs
+
+    :param account: (native or unicode string) account to delete from
+    :param container: (native or unicode string) container to delete from
+    :param objects: (list of native or unicode strings) objects to delete
+    :param timestamp: (Timestamp) time at which objects should be marked
+                      deleted
+    :returns: list of dicts appropriate for an UPDATE request to an
+              expiring-object queue
+    '''
+    return [
+        {
+            'name': build_task_obj(
+                timestamp, account, container,
+                obj, high_precision=True),
+            'deleted': 0,
+            'created_at': timestamp.internal,
+            'etag': MD5_OF_EMPTY_STRING,
+            'size': 0,
+            'storage_policy_index': 0,
+            'content_type': ASYNC_DELETE_TYPE,
+        } for obj in objects]
+
+
+def mark_for_deletion(swift, account, container, marker, end_marker,
+                      prefix, timestamp=None, yield_time=10):
+    '''
+    Enqueue jobs to async-delete some portion of a container's namespace
+
+    :param swift: InternalClient to use
+    :param account: account to delete from
+    :param container: container to delete from
+    :param marker: only delete objects after this name
+    :param end_marker: only delete objects before this name. Use ``None`` or
+                       empty string to delete to the end of the namespace.
+    :param prefix: only delete objects starting with this prefix
+    :param timestamp: delete all objects as of this time. If ``None``, the
+                      current time will be used.
+    :param yield_time: approximate period with which intermediate results
+                       should be returned. If ``None``, disable intermediate
+                       results.
+    :returns: If ``yield_time`` is ``None``, the number of objects marked for
+              deletion. Otherwise, a generator that will yield out tuples of
+              ``(number of marked objects, last object name)`` approximately
+              every ``yield_time`` seconds. The final tuple will have ``None``
+              as the second element. This form allows you to retry when an
+              error occurs partway through while minimizing duplicate work.
+    '''
+    if timestamp is None:
+        timestamp = Timestamp.now()
+
+    def enqueue_deletes():
+        deleted = 0
+        obj_iter = swift.iter_objects(
+            account, container,
+            marker=marker, end_marker=end_marker, prefix=prefix)
+        time_marker = time.time()
+        while True:
+            to_delete = [obj['name'] for obj in itertools.islice(
+                obj_iter, OBJECTS_PER_UPDATE)]
+            if not to_delete:
+                break
+            delete_jobs = make_delete_jobs(
+                account, container, to_delete, timestamp)
+            swift.make_request(
+                'UPDATE',
+                swift.make_path('.expiring_objects', str(int(timestamp))),
+                headers={'X-Backend-Allow-Private-Methods': 'True',
+                         'X-Backend-Storage-Policy-Index': '0',
+                         'X-Timestamp': timestamp.internal},
+                acceptable_statuses=(2,),
+                body_file=io.BytesIO(json.dumps(delete_jobs).encode('ascii')))
+            deleted += len(delete_jobs)
+            if yield_time is not None and \
+                    time.time() - time_marker > yield_time:
+                yield deleted, to_delete[-1]
+                time_marker = time.time()
+        yield deleted, None
+
+    if yield_time is None:
+        for deleted, marker in enqueue_deletes():
+            if marker is None:
+                return deleted
+    else:
+        return enqueue_deletes()
+
+
+def main(args=None):
+    parser = argparse.ArgumentParser(
+        description=__doc__,
+        formatter_class=argparse.RawTextHelpFormatter)
+    parser.add_argument('--config', default='/etc/swift/internal-client.conf',
+                        help=('internal-client config file '
+                              '(default: /etc/swift/internal-client.conf)'))
+    parser.add_argument('--request-tries', type=int, default=3,
+                        help='(default: 3)')
+    parser.add_argument('account', help='account from which to delete')
+    parser.add_argument('container', help='container from which to delete')
+    parser.add_argument(
+        '--prefix', default='',
+        help='only delete objects with this prefix (default: none)')
+    parser.add_argument(
+        '--marker', default='',
+        help='only delete objects after this marker (default: none)')
+    parser.add_argument(
+        '--end-marker', default='',
+        help='only delete objects before this end-marker (default: none)')
+    parser.add_argument(
+        '--timestamp', type=Timestamp, default=Timestamp.now(),
+        help='delete all objects as of this time (default: now)')
+    args = parser.parse_args(args)
+
+    swift = InternalClient(
+        args.config, 'Swift Container Deleter', args.request_tries,
+        global_conf={'log_name': 'container-deleter-ic'})
+    for deleted, marker in mark_for_deletion(
+            swift, args.account, args.container,
+            args.marker, args.end_marker, args.prefix, args.timestamp):
+        if marker is None:
+            print('Finished. Marked %d objects for deletion.' % deleted)
+        else:
+            print('Marked %d objects for deletion, through %r' % (
+                deleted, marker))
+
+
+if __name__ == '__main__':
+    main()
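
To make the queue format above concrete: each entry produced by make_delete_jobs() names an expirer task object that encodes the delete-at timestamp and the fully qualified object path. A hedged sketch; the account, container, and object names are invented:

    from swift.common.utils import Timestamp
    from swift.cli.container_deleter import make_delete_jobs

    jobs = make_delete_jobs('AUTH_test', 'photos', ['cat.jpg'], Timestamp.now())
    # Each job is one row destined for the .expiring_objects queue; the task
    # name looks like '<timestamp>-AUTH_test/photos/cat.jpg' and the content
    # type marks it as an async delete rather than a normal expiration.
    print(jobs[0]['name'], jobs[0]['content_type'])
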
diff --git a/swift/cli/dispersion_populate.py b/swift/cli/dispersion_populate.py
new file mode 100755
index 0000000000..b9508f551c
--- /dev/null
+++ b/swift/cli/dispersion_populate.py
@@ -0,0 +1,284 @@
+#!/usr/bin/env python
+# Copyright (c) 2010-2012 OpenStack Foundation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+# implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import io
+import traceback
+from optparse import OptionParser
+from sys import exit, stdout
+from time import time
+
+from eventlet import GreenPool, patcher, sleep
+from eventlet.pools import Pool
+from configparser import ConfigParser
+
+from swift.common.internal_client import SimpleClient
+from swift.common.ring import Ring
+from swift.common.utils import compute_eta, get_time_units, config_true_value
+from swift.common.storage_policy import POLICIES
+
+insecure = False
+
+
+def put_container(connpool, container, report, headers):
+    global retries_done
+    try:
+        with connpool.item() as conn:
+            conn.put_container(container, headers=headers)
+            retries_done += conn.attempts - 1
+        if report:
+            report(True)
+    except Exception:
+        if report:
+            report(False)
+        raise
+
+
+def put_object(connpool, container, obj, report):
+    global retries_done
+    try:
+        with connpool.item() as conn:
+            data = io.BytesIO(obj.encode('utf8'))
+            conn.put_object(container, obj, data,
+                            headers={'x-object-meta-dispersion': obj})
+            retries_done += conn.attempts - 1
+        if report:
+            report(True)
+    except Exception:
+        if report:
+            report(False)
+        raise
+
+
+def report(success):
+    global begun, created, item_type, next_report, need_to_create, retries_done
+    if not success:
+        traceback.print_exc()
+        exit('Gave up due to error(s).')
+    created += 1
+    if time() < next_report:
+        return
+    next_report = time() + 5
+    eta, eta_unit = compute_eta(begun, created, need_to_create)
+    print('\r\x1B[KCreating %s: %d of %d, %d%s left, %d retries'
+          % (item_type, created, need_to_create, round(eta), eta_unit,
+             retries_done), end='')
+    stdout.flush()
+
+
+def main():
+    global begun, created, item_type, next_report, need_to_create, retries_done
+    patcher.monkey_patch()
+    try:
+        # Delay importing so urllib3 will import monkey-patched modules
+        from swiftclient import get_auth
+    except ImportError:
+        from swift.common.internal_client import get_auth
+
+    conffile = '/etc/swift/dispersion.conf'
+
+    parser = OptionParser(usage='''
+Usage: %%prog [options] [conf_file]
+
+[conf_file] defaults to %s'''.strip() % conffile)
+    parser.add_option('--container-only', action='store_true', default=False,
+                      help='Only run container population')
+    parser.add_option('--object-only', action='store_true', default=False,
+                      help='Only run object population')
+    parser.add_option('--container-suffix-start', type=int, default=0,
+                      help='container suffix start value, defaults to 0')
+    parser.add_option('--object-suffix-start', type=int, default=0,
+                      help='object suffix start value, defaults to 0')
+    parser.add_option('--insecure', action='store_true', default=False,
+                      help='Allow accessing insecure keystone server. '
+                           'The keystone\'s certificate will not be verified.')
+    parser.add_option('--no-overlap', action='store_true', default=False,
+                      help="No overlap of partitions if running populate \
+                      more than once. Will increase coverage by amount shown \
+                      in dispersion.conf file")
+    parser.add_option('-P', '--policy-name', dest='policy_name',
+                      help="Specify storage policy name")
+
+    options, args = parser.parse_args()
+
+    if args:
+        conffile = args.pop(0)
+
+    c = ConfigParser()
+    if not c.read(conffile):
+        exit('Unable to read config file: %s' % conffile)
+    conf = dict(c.items('dispersion'))
+
+    if options.policy_name is None:
+        policy = POLICIES.default
+    else:
+        policy = POLICIES.get_by_name(options.policy_name)
+        if policy is None:
+            exit('Unable to find policy: %s' % options.policy_name)
+    print('Using storage policy: %s ' % policy.name)
+
+    swift_dir = conf.get('swift_dir', '/etc/swift')
+    dispersion_coverage = float(conf.get('dispersion_coverage', 1))
+    retries = int(conf.get('retries', 5))
+    concurrency = int(conf.get('concurrency', 25))
+    endpoint_type = str(conf.get('endpoint_type', 'publicURL'))
+    region_name = str(conf.get('region_name', ''))
+    user_domain_name = str(conf.get('user_domain_name', ''))
+    project_domain_name = str(conf.get('project_domain_name', ''))
+    project_name = str(conf.get('project_name', ''))
+    insecure = options.insecure \
+        or config_true_value(conf.get('keystone_api_insecure', 'no'))
+    container_populate = config_true_value(
+        conf.get('container_populate', 'yes')) and not options.object_only
+    object_populate = config_true_value(
+        conf.get('object_populate', 'yes')) and not options.container_only
+
+    if not (object_populate or container_populate):
+        exit("Neither container or object populate is set to run")
+
+    coropool = GreenPool(size=concurrency)
+    retries_done = 0
+
+    os_options = {'endpoint_type': endpoint_type}
+    if user_domain_name:
+        os_options['user_domain_name'] = user_domain_name
+    if project_domain_name:
+        os_options['project_domain_name'] = project_domain_name
+    if project_name:
+        os_options['project_name'] = project_name
+    if region_name:
+        os_options['region_name'] = region_name
+
+    url, token = get_auth(conf['auth_url'], conf['auth_user'],
+                          conf['auth_key'],
+                          auth_version=conf.get('auth_version', '1.0'),
+                          os_options=os_options,
+                          insecure=insecure)
+    account = url.rsplit('/', 1)[1]
+    connpool = Pool(max_size=concurrency)
+    headers = {}
+    headers['X-Storage-Policy'] = policy.name
+    connpool.create = lambda: SimpleClient(
+        url=url, token=token, retries=retries)
+
+    if container_populate:
+        container_ring = Ring(swift_dir, ring_name='container')
+        parts_left = dict((x, x)
+                          for x in range(container_ring.partition_count))
+
+        if options.no_overlap:
+            with connpool.item() as conn:
+                containers = [cont['name'] for cont in conn.get_account(
+                    prefix='dispersion_%d' % policy.idx, full_listing=True)[1]]
+            containers_listed = len(containers)
+            if containers_listed > 0:
+                for container in containers:
+                    partition, _junk = container_ring.get_nodes(account,
+                                                                container)
+                    if partition in parts_left:
+                        del parts_left[partition]
+
+        item_type = 'containers'
+        created = 0
+        retries_done = 0
+        need_to_create = need_to_queue = \
+            dispersion_coverage / 100.0 * container_ring.partition_count
+        begun = next_report = time()
+        next_report += 2
+        suffix = 0
+        while need_to_queue >= 1 and parts_left:
+            container = 'dispersion_%d_%d' % (policy.idx, suffix)
+            part = container_ring.get_part(account, container)
+            if part in parts_left:
+                if suffix >= options.container_suffix_start:
+                    coropool.spawn(put_container, connpool, container, report,
+                                   headers)
+                    sleep()
+                else:
+                    report(True)
+                del parts_left[part]
+                need_to_queue -= 1
+            suffix += 1
+        coropool.waitall()
+        elapsed, elapsed_unit = get_time_units(time() - begun)
+        print('\r\x1B[KCreated %d containers for dispersion reporting, '
+              '%d%s, %d retries' %
+              ((need_to_create - need_to_queue), round(elapsed), elapsed_unit,
+               retries_done))
+        if options.no_overlap:
+            con_coverage = container_ring.partition_count - len(parts_left)
+            print('\r\x1B[KTotal container coverage is now %.2f%%.' %
+                  ((float(con_coverage) / container_ring.partition_count
+                    * 100)))
+        stdout.flush()
+
+    if object_populate:
+        container = 'dispersion_objects_%d' % policy.idx
+        put_container(connpool, container, None, headers)
+        object_ring = Ring(swift_dir, ring_name=policy.ring_name)
+        parts_left = dict((x, x) for x in range(object_ring.partition_count))
+
+        if options.no_overlap:
+            with connpool.item() as conn:
+                obj_container = [cont_b['name'] for cont_b in conn.get_account(
+                    prefix=container, full_listing=True)[1]]
+            if obj_container:
+                with connpool.item() as conn:
+                    objects = [o['name'] for o in
+                               conn.get_container(container,
+                                                  prefix='dispersion_',
+                                                  full_listing=True)[1]]
+                for my_object in objects:
+                    partition = object_ring.get_part(account, container,
+                                                     my_object)
+                    if partition in parts_left:
+                        del parts_left[partition]
+
+        item_type = 'objects'
+        created = 0
+        retries_done = 0
+        need_to_create = need_to_queue = \
+            dispersion_coverage / 100.0 * object_ring.partition_count
+        begun = next_report = time()
+        next_report += 2
+        suffix = 0
+        while need_to_queue >= 1 and parts_left:
+            obj = 'dispersion_%d' % suffix
+            part = object_ring.get_part(account, container, obj)
+            if part in parts_left:
+                if suffix >= options.object_suffix_start:
+                    coropool.spawn(
+                        put_object, connpool, container, obj, report)
+                    sleep()
+                else:
+                    report(True)
+                del parts_left[part]
+                need_to_queue -= 1
+            suffix += 1
+        coropool.waitall()
+        elapsed, elapsed_unit = get_time_units(time() - begun)
+        print('\r\x1B[KCreated %d objects for dispersion reporting, '
+              '%d%s, %d retries' %
+              ((need_to_create - need_to_queue), round(elapsed), elapsed_unit,
+               retries_done))
+        if options.no_overlap:
+            obj_coverage = object_ring.partition_count - len(parts_left)
+            print('\r\x1B[KTotal object coverage is now %.2f%%.' %
+                  ((float(obj_coverage) / object_ring.partition_count * 100)))
+        stdout.flush()
+
+
+if __name__ == '__main__':
+    main()
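
The populate loop above walks an incrementing name suffix and only issues a PUT when the candidate name lands on a ring partition that has not been covered yet, stopping once the requested coverage is reached. A rough standalone sketch of that scan follows; `ring`, `account` and `policy_idx` are illustrative stand-ins (the `ring` is assumed to expose `partition_count` and `get_part(account, container)` like swift.common.ring.Ring), not names taken from the patch.

# Minimal sketch of the suffix scan used by the populate loop above.
def pick_dispersion_containers(ring, account, policy_idx, coverage_pct):
    # Partitions that still need a dispersion container placed on them.
    parts_left = set(range(ring.partition_count))
    need_to_queue = coverage_pct / 100.0 * ring.partition_count
    chosen, suffix = [], 0
    while need_to_queue >= 1 and parts_left:
        name = 'dispersion_%d_%d' % (policy_idx, suffix)
        part = ring.get_part(account, name)
        if part in parts_left:
            # A new partition is covered: remember the name and count it.
            parts_left.remove(part)
            chosen.append(name)
            need_to_queue -= 1
        suffix += 1
    return chosen
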
diff --git a/bin/swift-dispersion-report b/swift/cli/dispersion_report.py
old mode 100755
new mode 100644
similarity index 56%
rename from bin/swift-dispersion-report
rename to swift/cli/dispersion_report.py
index 590dede13c..20b0f7e114
--- a/bin/swift-dispersion-report
+++ b/swift/cli/dispersion_report.py
@@ -1,5 +1,5 @@
 #!/usr/bin/env python
-# Copyright (c) 2010-2012 OpenStack, LLC.
+# Copyright (c) 2010-2012 OpenStack Foundation
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
@@ -14,29 +14,30 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 
-import os
-from ConfigParser import ConfigParser
+import json
+from collections import defaultdict
+from configparser import ConfigParser
 from optparse import OptionParser
 from sys import exit, stdout, stderr
 from time import time
-try:
-    import simplejson as json
-except ImportError:
-    import json
 
 from eventlet import GreenPool, hubs, patcher, Timeout
 from eventlet.pools import Pool
 
 from swift.common import direct_client
-from swiftclient import ClientException, Connection, get_auth
+from swift.common.internal_client import SimpleClient
 from swift.common.ring import Ring
-from swift.common.utils import compute_eta, get_time_units, config_true_value
+from swift.common.exceptions import ClientException
+from swift.common.utils import compute_eta, get_time_units, \
+    config_true_value, node_to_string
+from swift.common.storage_policy import POLICIES
 
 
 unmounted = []
 notfound = []
 json_output = False
 debug = False
+insecure = False
 
 
 def get_error_log(prefix):
@@ -50,103 +51,106 @@ def error_log(msg_or_exc):
             if msg_or_exc.http_status == 507:
                 if identifier not in unmounted:
                     unmounted.append(identifier)
-                    print >>stderr, 'ERROR: %s is unmounted -- This will ' \
-                        'cause replicas designated for that device to be ' \
-                        'considered missing until resolved or the ring is ' \
-                        'updated.' % (identifier)
+                    print('ERROR: %s is unmounted -- This will '
+                          'cause replicas designated for that device to be '
+                          'considered missing until resolved or the ring is '
+                          'updated.' % (identifier), file=stderr)
                     stderr.flush()
             if debug and identifier not in notfound:
                 notfound.append(identifier)
-                print >>stderr, 'ERROR: %s returned a 404' % (identifier)
+                print('ERROR: %s returned a 404' % (identifier), file=stderr)
                 stderr.flush()
         if not hasattr(msg_or_exc, 'http_status') or \
                 msg_or_exc.http_status not in (404, 507):
-            print >>stderr, 'ERROR: %s: %s' % (prefix, msg_or_exc)
+            print('ERROR: %s: %s' % (prefix, msg_or_exc), file=stderr)
             stderr.flush()
     return error_log
 
 
 def container_dispersion_report(coropool, connpool, account, container_ring,
-                                retries, output_missing_partitions):
+                                retries, output_missing_partitions, policy):
     with connpool.item() as conn:
         containers = [c['name'] for c in conn.get_account(
-            prefix='dispersion_', full_listing=True)[1]]
+            prefix='dispersion_%d' % policy.idx, full_listing=True)[1]]
     containers_listed = len(containers)
     if not containers_listed:
-        print >>stderr, 'No containers to query. Has ' \
-                        'swift-dispersion-populate been run?'
+        print('No containers to query. Has '
+              'swift-dispersion-populate been run?', file=stderr)
         stderr.flush()
         return
     retries_done = [0]
     containers_queried = [0]
-    container_copies_found = [0] * (container_ring.replica_count + 1)
+    container_copies_missing = defaultdict(int)
+    container_copies_found = [0]
+    container_copies_expected = [0]
     begun = time()
     next_report = [time() + 2]
 
     def direct(container, part, nodes):
         found_count = 0
         for node in nodes:
-            error_log = get_error_log('%(ip)s:%(port)s/%(device)s' % node)
+            error_log = get_error_log(node_to_string(node))
             try:
                 attempts, _junk = direct_client.retry(
                     direct_client.direct_head_container, node, part, account,
                     container, error_log=error_log, retries=retries)
                 retries_done[0] += attempts - 1
                 found_count += 1
-            except ClientException, err:
+            except ClientException as err:
                 if err.http_status not in (404, 507):
                     error_log('Giving up on /%s/%s/%s: %s' % (part, account,
                               container, err))
-            except (Exception, Timeout), err:
+            except (Exception, Timeout) as err:
                 error_log('Giving up on /%s/%s/%s: %s' % (part, account,
                           container, err))
         if output_missing_partitions and \
-                found_count < container_ring.replica_count:
-            missing = container_ring.replica_count - found_count
-            print '\r\x1B[K',
+                found_count < len(nodes):
+            missing = len(nodes) - found_count
+            print('\r\x1B[K', end='')
             stdout.flush()
-            print >>stderr, '# Container partition %s missing %s cop%s' % (
-                part, missing, 'y' if missing == 1 else 'ies')
-        container_copies_found[found_count] += 1
+            print('# Container partition %s missing %s cop%s' % (
+                part, missing, 'y' if missing == 1 else 'ies'), file=stderr)
+        container_copies_found[0] += found_count
         containers_queried[0] += 1
+        container_copies_missing[len(nodes) - found_count] += 1
         if time() >= next_report[0]:
             next_report[0] = time() + 5
             eta, eta_unit = compute_eta(begun, containers_queried[0],
                                         containers_listed)
             if not json_output:
-                print '\r\x1B[KQuerying containers: %d of %d, %d%s left, %d ' \
+                print('\r\x1B[KQuerying containers: %d of %d, %d%s left, %d '
                       'retries' % (containers_queried[0], containers_listed,
-                      round(eta), eta_unit, retries_done[0]),
+                                   round(eta), eta_unit, retries_done[0]),
+                      end='')
                 stdout.flush()
     container_parts = {}
     for container in containers:
         part, nodes = container_ring.get_nodes(account, container)
         if part not in container_parts:
+            container_copies_expected[0] += len(nodes)
             container_parts[part] = part
             coropool.spawn(direct, container, part, nodes)
     coropool.waitall()
     distinct_partitions = len(container_parts)
-    copies_expected = distinct_partitions * container_ring.replica_count
-    copies_found = sum(a * b for a, b in enumerate(container_copies_found))
+    copies_found = container_copies_found[0]
+    copies_expected = container_copies_expected[0]
     value = 100.0 * copies_found / copies_expected
     elapsed, elapsed_unit = get_time_units(time() - begun)
+    container_copies_missing.pop(0, None)
     if not json_output:
-        print '\r\x1B[KQueried %d containers for dispersion reporting, ' \
+        print('\r\x1B[KQueried %d containers for dispersion reporting, '
               '%d%s, %d retries' % (containers_listed, round(elapsed),
-              elapsed_unit, retries_done[0])
+                                    elapsed_unit, retries_done[0]))
         if containers_listed - distinct_partitions:
-            print 'There were %d overlapping partitions' % (
-                  containers_listed - distinct_partitions)
-        for copies in xrange(container_ring.replica_count - 1, -1, -1):
-            missing_copies = container_ring.replica_count - copies
-            if container_copies_found[copies]:
-                print missing_string(container_copies_found[copies],
-                                     missing_copies,
-                                     container_ring.replica_count)
-        print '%.02f%% of container copies found (%d of %d)' % (
-            value, copies_found, copies_expected)
-        print 'Sample represents %.02f%% of the container partition space' % (
-            100.0 * distinct_partitions / container_ring.partition_count)
+            print('There were %d overlapping partitions' % (
+                  containers_listed - distinct_partitions))
+        for missing_copies, num_parts in container_copies_missing.items():
+            print(missing_string(num_parts, missing_copies,
+                                 container_ring.replica_count))
+        print('%.02f%% of container copies found (%d of %d)' % (
+            value, copies_found, copies_expected))
+        print('Sample represents %.02f%% of the container partition space' % (
+            100.0 * distinct_partitions / container_ring.partition_count))
         stdout.flush()
         return None
     else:
@@ -155,102 +159,112 @@ def direct(container, part, nodes):
                    'pct_found': value,
                    'copies_found': copies_found,
                    'copies_expected': copies_expected}
-        for copies in xrange(container_ring.replica_count):
-            missing_copies = container_ring.replica_count - copies
-            results['missing_%d' % (missing_copies)] = \
-                container_copies_found[copies]
+        for missing_copies, num_parts in container_copies_missing.items():
+            results['missing_%d' % (missing_copies)] = num_parts
         return results
 
 
 def object_dispersion_report(coropool, connpool, account, object_ring,
-                             retries, output_missing_partitions):
-    container = 'dispersion_objects'
+                             retries, output_missing_partitions, policy):
+    container = 'dispersion_objects_%d' % policy.idx
     with connpool.item() as conn:
         try:
             objects = [o['name'] for o in conn.get_container(
                 container, prefix='dispersion_', full_listing=True)[1]]
-        except ClientException, err:
+        except ClientException as err:
             if err.http_status != 404:
                 raise
-            print >>stderr, 'No objects to query. Has ' \
-                            'swift-dispersion-populate been run?'
+
+            print('No objects to query. Has '
+                  'swift-dispersion-populate been run?', file=stderr)
             stderr.flush()
             return
     objects_listed = len(objects)
     if not objects_listed:
-        print >>stderr, 'No objects to query. Has swift-dispersion-populate ' \
-                        'been run?'
+        print('No objects to query. Has swift-dispersion-populate '
+              'been run?', file=stderr)
         stderr.flush()
         return
     retries_done = [0]
     objects_queried = [0]
-    object_copies_found = [0] * (object_ring.replica_count + 1)
+    object_copies_found = [0]
+    object_copies_expected = [0]
+    object_copies_missing = defaultdict(int)
     begun = time()
     next_report = [time() + 2]
 
+    headers = None
+    if policy is not None:
+        headers = {}
+        headers['X-Backend-Storage-Policy-Index'] = int(policy)
+
     def direct(obj, part, nodes):
         found_count = 0
         for node in nodes:
-            error_log = get_error_log('%(ip)s:%(port)s/%(device)s' % node)
+            error_log = get_error_log(node_to_string(node))
             try:
                 attempts, _junk = direct_client.retry(
                     direct_client.direct_head_object, node, part, account,
-                    container, obj, error_log=error_log, retries=retries)
+                    container, obj, error_log=error_log, retries=retries,
+                    headers=headers)
                 retries_done[0] += attempts - 1
                 found_count += 1
-            except ClientException, err:
+            except ClientException as err:
                 if err.http_status not in (404, 507):
                     error_log('Giving up on /%s/%s/%s/%s: %s' % (part, account,
                               container, obj, err))
-            except (Exception, Timeout), err:
+            except (Exception, Timeout) as err:
                 error_log('Giving up on /%s/%s/%s/%s: %s' % (part, account,
                           container, obj, err))
         if output_missing_partitions and \
-                found_count < object_ring.replica_count:
-            missing = object_ring.replica_count - found_count
-            print '\r\x1B[K',
+                found_count < len(nodes):
+            missing = len(nodes) - found_count
+            print('\r\x1B[K', end='')
             stdout.flush()
-            print >>stderr, '# Object partition %s missing %s cop%s' % (
-                part, missing, 'y' if missing == 1 else 'ies')
-        object_copies_found[found_count] += 1
+            print('# Object partition %s missing %s cop%s' % (
+                part, missing, 'y' if missing == 1 else 'ies'), file=stderr)
+        object_copies_found[0] += found_count
+        object_copies_missing[len(nodes) - found_count] += 1
         objects_queried[0] += 1
         if time() >= next_report[0]:
             next_report[0] = time() + 5
             eta, eta_unit = compute_eta(begun, objects_queried[0],
                                         objects_listed)
             if not json_output:
-                print '\r\x1B[KQuerying objects: %d of %d, %d%s left, %d ' \
+                print('\r\x1B[KQuerying objects: %d of %d, %d%s left, %d '
                       'retries' % (objects_queried[0], objects_listed,
                                    round(eta), eta_unit, retries_done[0]),
+                      end='')
             stdout.flush()
     object_parts = {}
     for obj in objects:
         part, nodes = object_ring.get_nodes(account, container, obj)
         if part not in object_parts:
+            object_copies_expected[0] += len(nodes)
             object_parts[part] = part
             coropool.spawn(direct, obj, part, nodes)
     coropool.waitall()
     distinct_partitions = len(object_parts)
-    copies_expected = distinct_partitions * object_ring.replica_count
-    copies_found = sum(a * b for a, b in enumerate(object_copies_found))
+    copies_found = object_copies_found[0]
+    copies_expected = object_copies_expected[0]
     value = 100.0 * copies_found / copies_expected
     elapsed, elapsed_unit = get_time_units(time() - begun)
     if not json_output:
-        print '\r\x1B[KQueried %d objects for dispersion reporting, ' \
+        print('\r\x1B[KQueried %d objects for dispersion reporting, '
               '%d%s, %d retries' % (objects_listed, round(elapsed),
-              elapsed_unit, retries_done[0])
+                                    elapsed_unit, retries_done[0]))
         if objects_listed - distinct_partitions:
-            print 'There were %d overlapping partitions' % (
-                  objects_listed - distinct_partitions)
-        for copies in xrange(object_ring.replica_count - 1, -1, -1):
-            missing_copies = object_ring.replica_count - copies
-            if object_copies_found[copies]:
-                print missing_string(object_copies_found[copies],
-                                     missing_copies, object_ring.replica_count)
-        print '%.02f%% of object copies found (%d of %d)' % \
-            (value, copies_found, copies_expected)
-        print 'Sample represents %.02f%% of the object partition space' % (
-            100.0 * distinct_partitions / object_ring.partition_count)
+            print('There were %d overlapping partitions' % (
+                  objects_listed - distinct_partitions))
+
+        for missing_copies, num_parts in object_copies_missing.items():
+            print(missing_string(num_parts, missing_copies,
+                                 object_ring.replica_count))
+
+        print('%.02f%% of object copies found (%d of %d)' %
+              (value, copies_found, copies_expected))
+        print('Sample represents %.02f%% of the object partition space' % (
+            100.0 * distinct_partitions / object_ring.partition_count))
         stdout.flush()
         return None
     else:
@@ -259,10 +273,9 @@ def direct(obj, part, nodes):
                    'pct_found': value,
                    'copies_found': copies_found,
                    'copies_expected': copies_expected}
-        for copies in xrange(object_ring.replica_count):
-            missing_copies = object_ring.replica_count - copies
-            results['missing_%d' % (missing_copies)] = \
-                object_copies_found[copies]
+
+        for missing_copies, num_parts in object_copies_missing.items():
+            results['missing_%d' % (missing_copies,)] = num_parts
         return results
 
 
@@ -281,9 +294,9 @@ def missing_string(partition_count, missing_copies, copy_count):
         verb_string = 'were'
         partition_string = 'partitions'
 
-    copy_string = 'copy'
-    if missing_copies > 1:
-        copy_string = 'copies'
+    copy_string = 'copies'
+    if missing_copies == 1:
+        copy_string = 'copy'
 
     return '%sThere %s %d %s missing %s %s.' % (
         exclamations, verb_string, partition_count, partition_string,
@@ -291,7 +304,7 @@ def missing_string(partition_count, missing_copies, copy_count):
     )
 
 
-if __name__ == '__main__':
+def main():
     patcher.monkey_patch()
     hubs.get_hub().debug_exceptions = False
 
@@ -311,52 +324,110 @@ def missing_string(partition_count, missing_copies, copy_count):
                       help='Only run container report')
     parser.add_option('--object-only', action='store_true', default=False,
                       help='Only run object report')
-    options, args = parser.parse_args()
+    parser.add_option('--insecure', action='store_true', default=False,
+                      help='Allow accessing insecure keystone server. '
+                           'The keystone\'s certificate will not be verified.')
+    parser.add_option('-P', '--policy-name', dest='policy_name',
+                      help="Specify storage policy name")
 
+    options, args = parser.parse_args()
     if args:
         conffile = args.pop(0)
 
+    if options.debug:
+        global debug
+        debug = True
+
     c = ConfigParser()
     if not c.read(conffile):
         exit('Unable to read config file: %s' % conffile)
     conf = dict(c.items('dispersion'))
+
+    if options.dump_json:
+        conf['dump_json'] = 'yes'
+    if options.object_only:
+        conf['container_report'] = 'no'
+    if options.container_only:
+        conf['object_report'] = 'no'
+    if options.insecure:
+        conf['keystone_api_insecure'] = 'yes'
+    if options.partitions:
+        conf['partitions'] = 'yes'
+
+    output = generate_report(conf, options.policy_name)
+
+    if json_output:
+        print(json.dumps(output))
+
+
+def generate_report(conf, policy_name=None):
+    try:
+        # Delay importing so urllib3 will import monkey-patched modules
+        from swiftclient import get_auth
+    except ImportError:
+        from swift.common.internal_client import get_auth
+    global json_output
+    json_output = config_true_value(conf.get('dump_json', 'no'))
+    if policy_name is None:
+        policy = POLICIES.default
+    else:
+        policy = POLICIES.get_by_name(policy_name)
+        if policy is None:
+            exit('Unable to find policy: %s' % policy_name)
+    if not json_output:
+        print('Using storage policy: %s ' % policy.name)
+
     swift_dir = conf.get('swift_dir', '/etc/swift')
-    dispersion_coverage = int(conf.get('dispersion_coverage', 1))
     retries = int(conf.get('retries', 5))
     concurrency = int(conf.get('concurrency', 25))
-    if options.dump_json or config_true_value(conf.get('dump_json', 'no')):
-        json_output = True
-    container_report = config_true_value(conf.get('container_report', 'yes')) \
-        and not options.object_only
-    object_report = config_true_value(conf.get('object_report', 'yes')) \
-        and not options.container_only
+    endpoint_type = str(conf.get('endpoint_type', 'publicURL'))
+    region_name = str(conf.get('region_name', ''))
+    container_report = config_true_value(conf.get('container_report', 'yes'))
+    object_report = config_true_value(conf.get('object_report', 'yes'))
     if not (object_report or container_report):
         exit("Neither container or object report is set to run")
-    if options.debug:
-        debug = True
+    user_domain_name = str(conf.get('user_domain_name', ''))
+    project_domain_name = str(conf.get('project_domain_name', ''))
+    project_name = str(conf.get('project_name', ''))
+    insecure = config_true_value(conf.get('keystone_api_insecure', 'no'))
 
     coropool = GreenPool(size=concurrency)
 
+    os_options = {'endpoint_type': endpoint_type}
+    if user_domain_name:
+        os_options['user_domain_name'] = user_domain_name
+    if project_domain_name:
+        os_options['project_domain_name'] = project_domain_name
+    if project_name:
+        os_options['project_name'] = project_name
+    if region_name:
+        os_options['region_name'] = region_name
+
     url, token = get_auth(conf['auth_url'], conf['auth_user'],
                           conf['auth_key'],
-                          auth_version=conf.get('auth_version', '1.0'))
+                          auth_version=conf.get('auth_version', '1.0'),
+                          os_options=os_options,
+                          insecure=insecure)
     account = url.rsplit('/', 1)[1]
     connpool = Pool(max_size=concurrency)
-    connpool.create = lambda: Connection(
-        conf['auth_url'], conf['auth_user'], conf['auth_key'], retries=retries,
-        preauthurl=url, preauthtoken=token)
+    connpool.create = lambda: SimpleClient(
+        url=url, token=token, retries=retries)
 
     container_ring = Ring(swift_dir, ring_name='container')
-    object_ring = Ring(swift_dir, ring_name='object')
+    object_ring = Ring(swift_dir, ring_name=policy.ring_name)
 
     output = {}
     if container_report:
         output['container'] = container_dispersion_report(
             coropool, connpool, account, container_ring, retries,
-            options.partitions)
+            conf.get('partitions'), policy)
     if object_report:
         output['object'] = object_dispersion_report(
             coropool, connpool, account, object_ring, retries,
-            options.partitions)
-    if json_output:
-        print json.dumps(output)
+            conf.get('partitions'), policy)
+
+    return output
+
+
+if __name__ == '__main__':
+    main()
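
Both report functions above tally, per distinct partition, how many replicas answered the direct HEADs, then derive a found percentage plus per-missing-copy counts. A compact sketch of that aggregation, assuming the per-partition results have already been collected (`results_per_partition` is a made-up stand-in, not an object from the patch):

from collections import defaultdict

def summarize(results_per_partition):
    # results_per_partition: partition -> (copies_found, copies_expected),
    # a stand-in for the per-partition direct-HEAD tallies gathered above.
    copies_found = copies_expected = 0
    missing = defaultdict(int)  # number of missing copies -> partition count
    for found, expected in results_per_partition.values():
        copies_found += found
        copies_expected += expected
        missing[expected - found] += 1
    missing.pop(0, None)  # fully replicated partitions are not reported
    summary = {'pct_found': 100.0 * copies_found / copies_expected}
    for n_missing, num_parts in missing.items():
        summary['missing_%d' % n_missing] = num_parts
    return summary

# e.g. summarize({0: (3, 3), 1: (2, 3)}) -> {'pct_found': 83.33..., 'missing_1': 1}
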
diff --git a/swift/cli/drive_audit.py b/swift/cli/drive_audit.py
new file mode 100755
index 0000000000..fa8367895c
--- /dev/null
+++ b/swift/cli/drive_audit.py
@@ -0,0 +1,266 @@
+#!/usr/bin/env python
+# Copyright (c) 2010-2012 OpenStack Foundation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+# implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import datetime
+import glob
+import locale
+import os
+import os.path
+import re
+import subprocess
+import sys
+
+
+from configparser import ConfigParser
+
+from swift.common.utils import backward, get_logger, dump_recon_cache, \
+    config_true_value
+
+
+def get_devices(device_dir, logger):
+    devices = []
+    majmin_devices = {}
+
+    # List /dev/block
+    # Using os.scandir on recent versions of python, else os.listdir
+    if 'scandir' in dir(os):
+        with os.scandir("/dev/block") as it:
+            for ent in it:
+                if ent.is_symlink():
+                    dev_name = os.path.basename(os.readlink(ent.path))
+                    majmin = os.path.basename(ent.path).split(':')
+                    majmin_devices[dev_name] = {'major': majmin[0],
+                                                'minor': majmin[1]}
+    else:
+        for ent in os.listdir("/dev/block"):
+            ent_path = os.path.join("/dev/block", ent)
+            if os.path.islink(ent_path):
+                dev_name = os.path.basename(os.readlink(ent_path))
+                majmin = os.path.basename(ent_path).split(':')
+                majmin_devices[dev_name] = {'major': majmin[0],
+                                            'minor': majmin[1]}
+
+    for line in open('/proc/mounts').readlines():
+        data = line.strip().split()
+        block_device = data[0]
+        mount_point = data[1]
+        if mount_point.startswith(device_dir):
+            device = {}
+            device['mount_point'] = mount_point
+            device['block_device'] = block_device
+            dev_name = os.path.basename(block_device)
+            if dev_name in majmin_devices:
+                # If symlink is in /dev/block
+                device['major'] = majmin_devices[dev_name]['major']
+                device['minor'] = majmin_devices[dev_name]['minor']
+            else:
+                # Else we try to stat block_device
+                try:
+                    device_num = os.stat(block_device).st_rdev
+                except OSError:
+                    # If we can't stat the device,
+                    # then something weird is going on
+                    logger.error(
+                        'Could not determine major:minor numbers for %s '
+                        '(mounted at %s)! Skipping...',
+                        block_device, mount_point)
+                    continue
+                device['major'] = str(os.major(device_num))
+                device['minor'] = str(os.minor(device_num))
+            devices.append(device)
+    for line in open('/proc/partitions').readlines()[2:]:
+        major, minor, blocks, kernel_device = line.strip().split()
+        device = [d for d in devices
+                  if d['major'] == major and d['minor'] == minor]
+        if device:
+            device[0]['kernel_device'] = kernel_device
+    return devices
+
+
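
When a device has no /dev/block symlink, get_devices above falls back to stat()ing the block device and deriving the major:minor pair from st_rdev. A small illustrative sketch of that fallback (the device path is hypothetical):

import os

# '/dev/sda1' is only an example path; nothing is printed if it is absent.
dev = '/dev/sda1'
if os.path.exists(dev):
    rdev = os.stat(dev).st_rdev
    print('%s -> %s:%s' % (dev, os.major(rdev), os.minor(rdev)))
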
+def get_errors(error_re, log_file_pattern, minutes, logger,
+               log_file_encoding):
+    # Assuming log rotation is being used, we need to examine
+    # recently rotated files in case the rotation occurred
+    # just before the script is being run - the data we are
+    # looking for may have rotated.
+    #
+    # The globbing used previously did not work with every distro's
+    # out-of-box logrotate and syslog setup, so the pattern was moved
+    # to the config where the desired globbing can be set.
+    log_files = glob.glob(log_file_pattern)
+    try:
+        log_files.sort(key=lambda f: os.stat(f).st_mtime, reverse=True)
+    except (IOError, OSError) as exc:
+        logger.error(exc)
+        print(exc)
+        sys.exit(1)
+
+    now_time = datetime.datetime.now()
+    end_time = now_time - datetime.timedelta(minutes=minutes)
+    # kern.log does not contain the year so we need to keep
+    # track of the year and month in case the year recently
+    # ticked over
+    year = now_time.year
+    prev_ent_month = now_time.strftime('%b')
+    errors = {}
+
+    reached_old_logs = False
+    for path in log_files:
+        try:
+            f = open(path, 'rb')
+        except IOError:
+            logger.error("Error: Unable to open " + path)
+            print("Unable to open " + path)
+            sys.exit(1)
+        for line in backward(f):
+            line = line.decode(log_file_encoding, 'surrogateescape')
+            if '[    0.000000]' in line \
+                or 'KERNEL supported cpus:' in line \
+                    or 'BIOS-provided physical RAM map:' in line:
+                # Ignore anything before the last boot
+                reached_old_logs = True
+                break
+            # Solves the problem with year change - kern.log does not
+            # keep track of the year.
+            log_time_ent = line.split()[:3]
+            if log_time_ent[0] == 'Dec' and prev_ent_month == 'Jan':
+                year -= 1
+            prev_ent_month = log_time_ent[0]
+            log_time_string = '%d %s' % (year, ' '.join(log_time_ent))
+            try:
+                log_time = datetime.datetime.strptime(
+                    log_time_string, '%Y %b %d %H:%M:%S')
+            except ValueError:
+                # Some versions use ISO timestamps instead
+                try:
+                    log_time = datetime.datetime.strptime(
+                        line[0:19], '%Y-%m-%dT%H:%M:%S')
+                except ValueError:
+                    continue
+            if log_time > end_time:
+                for err in error_re:
+                    for device in err.findall(line):
+                        errors[device] = errors.get(device, 0) + 1
+            else:
+                reached_old_logs = True
+                break
+        if reached_old_logs:
+            break
+    return errors
+
+
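
Because kern.log timestamps carry no year, get_errors above decrements the year whenever a backwards scan crosses from January into December. A tiny sketch of that parse with made-up values:

import datetime

# kern.log entries carry no year, e.g. "Dec 31 23:59:58 host kernel: ..."
now = datetime.datetime(2024, 1, 1, 0, 5, 0)   # pretend "now" is early January
year = now.year
prev_ent_month = now.strftime('%b')            # 'Jan'

log_time_ent = ['Dec', '31', '23:59:58']       # fields seen while scanning backwards
if log_time_ent[0] == 'Dec' and prev_ent_month == 'Jan':
    year -= 1                                  # the entry belongs to the previous year
log_time = datetime.datetime.strptime(
    '%d %s' % (year, ' '.join(log_time_ent)), '%Y %b %d %H:%M:%S')
print(log_time)                                # 2023-12-31 23:59:58
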
+def comment_fstab(mount_point):
+    with open('/etc/fstab', 'r') as fstab:
+        with open('/etc/fstab.new', 'w') as new_fstab:
+            for line in fstab:
+                parts = line.split()
+                if len(parts) > 2 \
+                    and parts[1] == mount_point \
+                        and not line.startswith('#'):
+                    new_fstab.write('#' + line)
+                else:
+                    new_fstab.write(line)
+    os.rename('/etc/fstab.new', '/etc/fstab')
+
+
+def main():
+    c = ConfigParser()
+    try:
+        conf_path = sys.argv[1]
+    except Exception:
+        print("Usage: %s CONF_FILE" % sys.argv[0].split('/')[-1])
+        sys.exit(1)
+    if not c.read(conf_path):
+        print("Unable to read config file %s" % conf_path)
+        sys.exit(1)
+    conf = dict(c.items('drive-audit'))
+    device_dir = conf.get('device_dir', '/srv/node')
+    minutes = int(conf.get('minutes', 60))
+    error_limit = int(conf.get('error_limit', 1))
+    recon_cache_path = conf.get('recon_cache_path', "/var/cache/swift")
+    log_file_pattern = conf.get('log_file_pattern',
+                                '/var/log/kern.*[!.][!g][!z]')
+    log_file_encoding = conf.get('log_file_encoding', 'auto')
+    if log_file_encoding == 'auto':
+        log_file_encoding = locale.getpreferredencoding()
+    log_to_console = config_true_value(conf.get('log_to_console', False))
+    error_re = []
+    for conf_key in conf:
+        if conf_key.startswith('regex_pattern_'):
+            error_pattern = conf[conf_key]
+            try:
+                r = re.compile(error_pattern)
+            except re.error:
+                sys.exit('Error: unable to compile regex pattern "%s"' %
+                         error_pattern)
+            error_re.append(r)
+    if not error_re:
+        error_re = [
+            re.compile(r'\berror\b.*\b(sd[a-z]{1,2}\d?)\b'),
+            re.compile(r'\b(sd[a-z]{1,2}\d?)\b.*\berror\b'),
+        ]
+    conf['log_name'] = conf.get('log_name', 'drive-audit')
+    logger = get_logger(conf, log_to_console=log_to_console,
+                        log_route='drive-audit')
+    devices = get_devices(device_dir, logger)
+    logger.debug("Devices found: %s" % str(devices))
+    if not devices:
+        logger.error("Error: No devices found!")
+    recon_errors = {}
+    total_errors = 0
+    for device in devices:
+        recon_errors[device['mount_point']] = 0
+    errors = get_errors(error_re, log_file_pattern, minutes, logger,
+                        log_file_encoding)
+    logger.debug("Errors found: %s" % str(errors))
+    unmounts = 0
+    for kernel_device, count in errors.items():
+        if count >= error_limit:
+            device = \
+                [d for d in devices if d['kernel_device'] == kernel_device]
+            if device:
+                mount_point = device[0]['mount_point']
+                if mount_point.startswith(device_dir):
+                    if config_true_value(conf.get('unmount_failed_device',
+                                                  True)):
+                        logger.info("Unmounting %s with %d errors" %
+                                    (mount_point, count))
+                        subprocess.call(['umount', '-fl', mount_point])
+                        logger.info("Commenting out %s from /etc/fstab" %
+                                    (mount_point))
+                        comment_fstab(mount_point)
+                        unmounts += 1
+                    else:
+                        logger.info("Detected %s with %d errors "
+                                    "(Device not unmounted)" %
+                                    (mount_point, count))
+                    recon_errors[mount_point] = count
+                    total_errors += count
+    recon_file = recon_cache_path + "/drive.recon"
+    dump_recon_cache(recon_errors, recon_file, logger)
+    dump_recon_cache({'drive_audit_errors': total_errors}, recon_file, logger,
+                     set_owner=conf.get("user", "swift"))
+
+    if unmounts == 0:
+        logger.info("No drives were unmounted")
+    elif os.path.isdir("/run/systemd/system"):
+        logger.debug("fstab updated, calling systemctl daemon-reload")
+        subprocess.call(["/usr/bin/systemctl", "daemon-reload"])
+
+
+if __name__ == '__main__':
+    main()
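
Putting the default regexes to work, here is a short sketch of how drive-audit counts errors per device from kernel log lines; the patterns are copied from main() above, while the sample lines are invented (real kern.log formats vary):

import re

error_re = [
    re.compile(r'\berror\b.*\b(sd[a-z]{1,2}\d?)\b'),
    re.compile(r'\b(sd[a-z]{1,2}\d?)\b.*\berror\b'),
]
lines = [
    'Mar  3 12:00:01 host kernel: I/O error, dev sdb, sector 1234',
    'Mar  3 12:00:02 host kernel: sdb1: read error on sector 5678',
]
errors = {}
for line in lines:
    for err in error_re:
        for device in err.findall(line):
            errors[device] = errors.get(device, 0) + 1
print(errors)   # {'sdb': 1, 'sdb1': 1}
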
diff --git a/swift/cli/form_signature.py b/swift/cli/form_signature.py
new file mode 100644
index 0000000000..7a8bff7250
--- /dev/null
+++ b/swift/cli/form_signature.py
@@ -0,0 +1,131 @@
+# Copyright (c) 2010-2012 OpenStack Foundation
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+# implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+"""
+Script for generating a form signature for use with FormPost middleware.
+"""
+import hmac
+from hashlib import sha1
+from os.path import basename
+from time import time
+
+
+def main(argv):
+    if len(argv) != 7:
+        prog = basename(argv[0])
+        print('Syntax: %s <path> <redirect> <max_file_size> '
+              '<max_file_count> <seconds> <key>' % prog)
+        print()
+        print('Where:')
+        print('  <path>            The prefix to use for form uploaded')
+        print('                    objects. For example:')
+        print('                    /v1/account/container/object_prefix_ would')
+        print('                    ensure all form uploads have that path')
+        print('                    prepended to the browser-given file name.')
+        print('  <redirect>        The URL to redirect the browser to after')
+        print('                    the uploads have completed.')
+        print('  <max_file_size>   The maximum file size per file uploaded.')
+        print('  <max_file_count>  The maximum number of uploaded files')
+        print('                    allowed.')
+        print('  <seconds>         The number of seconds from now to allow')
+        print('                    the form post to begin.')
+        print('  <key>             The X-Account-Meta-Temp-URL-Key for the')
+        print('                    account.')
+        print()
+        print('Example output:')
+        print('    Expires: 1323842228')
+        print('  Signature: 18de97e47345a82c4dbfb3b06a640dbb')
+        print()
+        print('Sample form:')
+        print()
+        print('NOTE: the <form> tag\'s "action" attribute does not contain '
+              'the Swift cluster\'s hostname.')
+        print('You should manually add it before using the form.')
+        print()
+        print('')
+        print(' ')
+        print(' ... more HTML ...')
+        print(' ')
+        print('')
+        return 1
+    path, redirect, max_file_size, max_file_count, seconds, key = argv[1:]
+    try:
+        max_file_size = int(max_file_size)
+    except ValueError:
+        max_file_size = -1
+    if max_file_size < 0:
+        print('Please use a value greater than or equal to 0.')
+        return 1
+    try:
+        max_file_count = int(max_file_count)
+    except ValueError:
+        max_file_count = 0
+    if max_file_count < 1:
+        print('Please use a positive value.')
+        return 1
+    try:
+        expires = int(time() + int(seconds))
+    except ValueError:
+        expires = 0
+    if expires < 1:
+        print('Please use a positive value.')
+        return 1
+    parts = path.split('/', 4)
+    # Must be four parts, ['', 'v1', 'a', 'c'], must be a v1 request, have
+    # account and container values, and optionally have an object prefix.
+    if len(parts) < 4 or parts[0] or parts[1] != 'v1' or not parts[2] or \
+            not parts[3]:
+        print('<path> must point to a container at least.')
+        print('For example: /v1/account/container')
+        print('         Or: /v1/account/container/object_prefix')
+        return 1
+    data = '%s\n%s\n%s\n%s\n%s' % (path, redirect, max_file_size,
+                                   max_file_count, expires)
+    data = data.encode('utf8')
+    key = key if isinstance(key, bytes) else \
+        key.encode('utf8')
+    sig = hmac.new(key, data,
+                   sha1).hexdigest()
+    print('  Expires:', expires)
+    print('Signature:', sig)
+    print('')
+
+    print('Sample form:\n')
+
+    print('NOTE: the 
tag\'s "action" attribute does not ' + 'contain the Swift cluster\'s hostname.') + print('You should manually add it before using the form.\n') + + print('' + % path) + if redirect: + print(' ' + % redirect) + print(' ' + % max_file_size) + print(' ' + % max_file_count) + print(' ' % expires) + print(' ' % sig) + print(' ' + % max_file_count) + print(' ') + print(' ') + for i in range(max_file_count): + print(' ' % i) + print('
') + print(' ') + print('
') + return 0 diff --git a/swift/cli/get_nodes.py b/swift/cli/get_nodes.py new file mode 100755 index 0000000000..7586cd3b46 --- /dev/null +++ b/swift/cli/get_nodes.py @@ -0,0 +1,80 @@ +#!/usr/bin/env python +# Copyright (c) 2010-2012 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +import sys +from optparse import OptionParser +from os.path import basename + +from swift.common.ring import Ring +from swift.common.storage_policy import reload_storage_policies +from swift.common.utils import set_swift_dir +from swift.cli.info import (parse_get_node_args, print_item_locations, + InfoSystemExit) + + +def main(): + + usage = ''' + Shows the nodes responsible for the item specified. + Usage: %prog [-a] [ []] + Or: %prog [-a] -p partition + Or: %prog [-a] -P policy_name [ []] + Or: %prog [-a] -P policy_name -p partition + Note: account, container, object can also be a single arg separated by / + Example: + $ %prog -a /etc/swift/account.ring.gz MyAccount + Partition 5743883 + Hash 96ae332a60b58910784e4417a03e1ad0 + 10.1.1.7:8000 sdd1 + 10.1.9.2:8000 sdb1 + 10.1.5.5:8000 sdf1 + 10.1.5.9:8000 sdt1 # [Handoff] + ''' + parser = OptionParser(usage) + parser.add_option('-a', '--all', action='store_true', + help='Show all handoff nodes') + parser.add_option('-p', '--partition', metavar='PARTITION', + help='Show nodes for a given partition') + parser.add_option('-P', '--policy-name', dest='policy_name', + help='Specify which policy to use') + parser.add_option('-d', '--swift-dir', default='/etc/swift', + dest='swift_dir', help='Path to swift directory') + parser.add_option('-Q', '--quoted', action='store_true', + help='Assume swift paths are quoted') + options, args = parser.parse_args() + + if set_swift_dir(options.swift_dir): + reload_storage_policies() + + try: + ring_path, args = parse_get_node_args(options, args) + except InfoSystemExit as e: + parser.print_help() + sys.exit('ERROR: %s' % e) + + ring = ring_name = None + if ring_path: + ring_name = basename(ring_path)[:-len('.ring.gz')] + ring = Ring(ring_path) + + try: + print_item_locations(ring, ring_name, *args, **vars(options)) + except InfoSystemExit: + sys.exit(1) + + +if __name__ == '__main__': + main() diff --git a/swift/cli/info.py b/swift/cli/info.py new file mode 100644 index 0000000000..ffaaee253a --- /dev/null +++ b/swift/cli/info.py @@ -0,0 +1,813 @@ +# Licensed under the Apache License, Version 2.0 (the "License"); you may not +# use this file except in compliance with the License. You may obtain a copy +# of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT +# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the +# License for the specific language governing permissions and limitations +# under the License. 
+ + +import codecs +import itertools +import json +from optparse import OptionParser +import os +import sqlite3 +import sys +from collections import defaultdict + +import urllib + +from swift.common.exceptions import LockTimeout +from swift.common.utils import hash_path, storage_directory, \ + Timestamp, is_valid_ipv6 +from swift.common.ring import Ring +from swift.common.request_helpers import is_sys_meta, is_user_meta, \ + strip_sys_meta_prefix, strip_user_meta_prefix, \ + is_object_transient_sysmeta, strip_object_transient_sysmeta_prefix +from swift.account.backend import AccountBroker, DATADIR as ABDATADIR +from swift.container.backend import ContainerBroker, DATADIR as CBDATADIR +from swift.obj.diskfile import get_data_dir, read_metadata, DATADIR_BASE, \ + extract_policy +from swift.common.storage_policy import POLICIES, reload_storage_policies +from swift.common.swob import wsgi_to_str +from swift.common.middleware.crypto.crypto_utils import load_crypto_meta +from swift.common.utils import md5, set_swift_dir + + +class InfoSystemExit(Exception): + """ + Indicates to the caller that a sys.exit(1) should be performed. + """ + pass + + +def parse_get_node_args(options, args): + """ + Parse the get_nodes commandline args + + :returns: a tuple, (ring_path, args) + """ + ring_path = None + + if options.policy_name: + if POLICIES.get_by_name(options.policy_name) is None: + raise InfoSystemExit('No policy named %r' % options.policy_name) + elif args and args[0].endswith('.ring.gz'): + if os.path.exists(args[0]): + ring_path = args.pop(0) + else: + raise InfoSystemExit('Ring file does not exist') + + if options.quoted: + args = [urllib.parse.unquote(arg) for arg in args] + if len(args) == 1: + args = args[0].strip('/').split('/', 2) + + if not ring_path and not options.policy_name: + raise InfoSystemExit('Need to specify policy_name or ') + + if not (args or options.partition): + raise InfoSystemExit('No target specified') + + if len(args) > 3: + raise InfoSystemExit('Invalid arguments') + + return ring_path, args + + +def curl_head_command(ip, port, device, part, target, policy_index): + """ + Provide a string that is a well formatted curl command to HEAD an object + on a storage node. + + :param ip: the ip of the node + :param port: the port of the node + :param device: the device of the node + :param target: the path of the target resource + :param policy_index: the policy_index of the target resource (can be None) + + :returns: a string, a well formatted curl command + """ + if is_valid_ipv6(ip): + formatted_ip = '[%s]' % ip + else: + formatted_ip = ip + + cmd = 'curl -g -I -XHEAD "http://%s:%s/%s/%s/%s"' % ( + formatted_ip, port, device, part, urllib.parse.quote(target)) + if policy_index is not None: + cmd += ' -H "%s: %s"' % ('X-Backend-Storage-Policy-Index', + policy_index) + cmd += ' --path-as-is' + return cmd + + +def print_ring_locations(ring, datadir, account, container=None, obj=None, + tpart=None, all_nodes=False, policy_index=None): + """ + print out ring locations of specified type + + :param ring: ring instance + :param datadir: name of directory where things are stored. Usually one of + "accounts", "containers", "objects", or "objects-N". + :param account: account name + :param container: container name + :param obj: object name + :param tpart: target partition in ring + :param all_nodes: include all handoff nodes. If false, only the N primary + nodes and first N handoffs will be printed. 
+ :param policy_index: include policy_index in curl headers + """ + if not ring: + raise ValueError("No ring specified") + if not datadir: + raise ValueError("No datadir specified") + if tpart is None and not account: + raise ValueError("No partition or account/container/object specified") + if not account and (container or obj): + raise ValueError("Container/object specified without account") + if obj and not container: + raise ValueError('Object specified without container') + + if obj: + target = '%s/%s/%s' % (account, container, obj) + elif container: + target = '%s/%s' % (account, container) + else: + target = '%s' % (account) + + if tpart: + part = int(tpart) + else: + part = ring.get_part(account, container, obj) + + primary_nodes = ring.get_part_nodes(part) + handoff_nodes = ring.get_more_nodes(part) + if not all_nodes: + handoff_nodes = itertools.islice(handoff_nodes, len(primary_nodes)) + handoff_nodes = list(handoff_nodes) + + if account and not tpart: + path_hash = hash_path(account, container, obj) + else: + path_hash = None + print('Partition\t%s' % part) + print('Hash \t%s\n' % path_hash) + + for node in primary_nodes: + print('Server:Port Device\t%s:%s %s' % (node['ip'], node['port'], + node['device'])) + for node in handoff_nodes: + print('Server:Port Device\t%s:%s %s\t [Handoff]' % ( + node['ip'], node['port'], node['device'])) + + print("\n") + + for node in primary_nodes: + cmd = curl_head_command(node['ip'], node['port'], node['device'], + part, target, policy_index) + print(cmd) + for node in handoff_nodes: + cmd = curl_head_command(node['ip'], node['port'], node['device'], + part, target, policy_index) + cmd += ' # [Handoff]' + print(cmd) + + print("\n\nUse your own device location of servers:") + print("such as \"export DEVICE=/srv/node\"") + if path_hash: + for node in primary_nodes: + print('ssh %s "ls -lah ${DEVICE:-/srv/node*}/%s/%s"' % + (node['ip'], node['device'], + storage_directory(datadir, part, path_hash))) + for node in handoff_nodes: + print('ssh %s "ls -lah ${DEVICE:-/srv/node*}/%s/%s" # [Handoff]' % + (node['ip'], node['device'], + storage_directory(datadir, part, path_hash))) + else: + for node in primary_nodes: + print('ssh %s "ls -lah ${DEVICE:-/srv/node*}/%s/%s/%d"' % + (node['ip'], node['device'], datadir, part)) + for node in handoff_nodes: + print('ssh %s "ls -lah ${DEVICE:-/srv/node*}/%s/%s/%d"' + ' # [Handoff]' % + (node['ip'], node['device'], datadir, part)) + + print('\nnote: `/srv/node*` is used as default value of `devices`, the ' + 'real value is set in the config file on each storage node.') + + +def get_max_len_sync_item(syncs, item, title): + def map_func(element): + return str(element[item]) + return max(list(map(len, map(map_func, syncs))) + [len(title)]) + + +def print_db_syncs(incoming, syncs): + max_sync_point_len = get_max_len_sync_item(syncs, 'sync_point', + "Sync Point") + max_remote_len = get_max_len_sync_item(syncs, 'remote_id', "Remote ID") + print('%s Syncs:' % ('Incoming' if incoming else 'Outgoing')) + print(' %s\t%s\t%s' % ("Sync Point".ljust(max_sync_point_len), + "Remote ID".ljust(max_remote_len), + "Updated At")) + for sync in syncs: + print(' %s\t%s\t%s (%s)' % ( + str(sync['sync_point']).ljust(max_sync_point_len), + sync['remote_id'].ljust(max_remote_len), + Timestamp(sync['updated_at']).isoformat, + sync['updated_at'])) + + +def print_db_info_metadata(db_type, info, metadata, drop_prefixes=False, + verbose=False): + """ + print out data base info/metadata based on its type + + :param db_type: database type, 
account or container + :param info: dict of data base info + :param metadata: dict of data base metadata + :param drop_prefixes: if True, strip "X-Account-Meta-", + "X-Container-Meta-", "X-Account-Sysmeta-", and + "X-Container-Sysmeta-" when displaying + User Metadata and System Metadata dicts + """ + if info is None: + raise ValueError('DB info is None') + + if db_type not in ['container', 'account']: + raise ValueError('Wrong DB type') + + try: + account = info['account'] + container = None + + if db_type == 'container': + container = info['container'] + path = '/%s/%s' % (account, container) + else: + path = '/%s' % account + + print('Path: %s' % path) + print(' Account: %s' % account) + + if db_type == 'container': + print(' Container: %s' % container) + + print(' Deleted: %s' % info['is_deleted']) + path_hash = hash_path(account, container) + if db_type == 'container': + print(' Container Hash: %s' % path_hash) + else: + print(' Account Hash: %s' % path_hash) + + print('Metadata:') + print(' Created at: %s (%s)' % + (Timestamp(info['created_at']).isoformat, + info['created_at'])) + print(' Put Timestamp: %s (%s)' % + (Timestamp(info['put_timestamp']).isoformat, + info['put_timestamp'])) + print(' Delete Timestamp: %s (%s)' % + (Timestamp(info['delete_timestamp']).isoformat, + info['delete_timestamp'])) + print(' Status Timestamp: %s (%s)' % + (Timestamp(info['status_changed_at']).isoformat, + info['status_changed_at'])) + if db_type == 'account': + print(' Container Count: %s' % info['container_count']) + print(' Object Count: %s' % info['object_count']) + print(' Bytes Used: %s' % info['bytes_used']) + if db_type == 'container': + try: + policy_name = POLICIES[info['storage_policy_index']].name + except KeyError: + policy_name = 'Unknown' + print(' Storage Policy: %s (%s)' % ( + policy_name, info['storage_policy_index'])) + print(' Reported Put Timestamp: %s (%s)' % + (Timestamp(info['reported_put_timestamp']).isoformat, + info['reported_put_timestamp'])) + print(' Reported Delete Timestamp: %s (%s)' % + (Timestamp(info['reported_delete_timestamp']).isoformat, + info['reported_delete_timestamp'])) + print(' Reported Object Count: %s' % + info['reported_object_count']) + print(' Reported Bytes Used: %s' % info['reported_bytes_used']) + print(' Chexor: %s' % info['hash']) + print(' UUID: %s' % info['id']) + except KeyError as e: + raise ValueError('Info is incomplete: %s' % e) + + meta_prefix = 'x_' + db_type + '_' + for key, value in info.items(): + if key.lower().startswith(meta_prefix): + title = key.replace('_', '-').title() + print(' %s: %s' % (title, value)) + user_metadata = {} + sys_metadata = {} + for key, (value, timestamp) in metadata.items(): + if is_user_meta(db_type, key): + if drop_prefixes: + key = strip_user_meta_prefix(db_type, key) + user_metadata[key] = value + elif is_sys_meta(db_type, key): + if drop_prefixes: + key = strip_sys_meta_prefix(db_type, key) + sys_metadata[key] = value + else: + title = key.replace('_', '-').title() + print(' %s: %s' % (title, value)) + if sys_metadata: + print(' System Metadata:') + for key, value in sys_metadata.items(): + print(' %s: %s' % (key, value)) + else: + print('No system metadata found in db file') + + if user_metadata: + print(' User Metadata:') + for key, value in user_metadata.items(): + print(' %s: %s' % (key, value)) + else: + print('No user metadata found in db file') + + if db_type == 'container': + print('Sharding Metadata:') + shard_type = 'root' if info['is_root'] else 'shard' + print(' Type: %s' % shard_type) + 
print(' State: %s' % info['db_state']) + if info.get('shard_ranges'): + num_shards = len(info['shard_ranges']) + print('Shard Ranges (%d):' % num_shards) + count_by_state = defaultdict(int) + for srange in info['shard_ranges']: + count_by_state[(srange.state, srange.state_text)] += 1 + print(' States:') + for key_state, count in sorted(count_by_state.items()): + key, state = key_state + print(' %9s: %s' % (state, count)) + if verbose: + for srange in info['shard_ranges']: + srange = dict(srange, state_text=srange.state_text) + print(' Name: %(name)s' % srange) + print(' lower: %(lower)r, upper: %(upper)r' % srange) + print(' Object Count: %(object_count)d, Bytes Used: ' + '%(bytes_used)d, State: %(state_text)s (%(state)d)' + % srange) + print(' Created at: %s (%s)' + % (Timestamp(srange['timestamp']).isoformat, + srange['timestamp'])) + print(' Meta Timestamp: %s (%s)' + % (Timestamp(srange['meta_timestamp']).isoformat, + srange['meta_timestamp'])) + else: + print('(Use -v/--verbose to show more Shard Ranges details)') + + +def print_obj_metadata(metadata, drop_prefixes=False): + """ + Print out basic info and metadata from object, as returned from + :func:`swift.obj.diskfile.read_metadata`. + + Metadata should include the keys: name, Content-Type, and + X-Timestamp. + + Additional metadata is displayed unmodified. + + :param metadata: dict of object metadata + :param drop_prefixes: if True, strip "X-Object-Meta-", "X-Object-Sysmeta-", + and "X-Object-Transient-Sysmeta-" when displaying + User Metadata, System Metadata, and Transient + System Metadata entries + + :raises ValueError: + """ + user_metadata = {} + sys_metadata = {} + transient_sys_metadata = {} + other_metadata = {} + + if not metadata: + raise ValueError('Metadata is None') + path = metadata.pop('name', '') + content_type = metadata.pop('Content-Type', '') + ts = Timestamp(metadata.pop('X-Timestamp', Timestamp.zero())) + account = container = obj = obj_hash = None + if path: + try: + account, container, obj = path.split('/', 3)[1:] + except ValueError: + raise ValueError('Path is invalid for object %r' % path) + else: + obj_hash = hash_path(account, container, obj) + print('Path: %s' % path) + print(' Account: %s' % account) + print(' Container: %s' % container) + print(' Object: %s' % obj) + print(' Object hash: %s' % obj_hash) + else: + print('Path: Not found in metadata') + if content_type: + print('Content-Type: %s' % content_type) + else: + print('Content-Type: Not found in metadata') + if ts: + print('Timestamp: %s (%s)' % (ts.isoformat, ts.internal)) + else: + print('Timestamp: Not found in metadata') + + for key, value in metadata.items(): + if is_user_meta('Object', key): + if drop_prefixes: + key = strip_user_meta_prefix('Object', key) + user_metadata[key] = value + elif is_sys_meta('Object', key): + if drop_prefixes: + key = strip_sys_meta_prefix('Object', key) + sys_metadata[key] = value + elif is_object_transient_sysmeta(key): + if drop_prefixes: + key = strip_object_transient_sysmeta_prefix(key) + transient_sys_metadata[key] = value + else: + other_metadata[key] = value + + def print_metadata(title, items): + print(title) + if items: + for key, value in sorted(items.items()): + print(' %s: %s' % (key, value)) + else: + print(' No metadata found') + + print_metadata('System Metadata:', sys_metadata) + print_metadata('Transient System Metadata:', transient_sys_metadata) + print_metadata('User Metadata:', user_metadata) + print_metadata('Other Metadata:', other_metadata) + for label, meta in [ + ('Data crypto 
details', + sys_metadata.get('X-Object-Sysmeta-Crypto-Body-Meta')), + ('Metadata crypto details', + transient_sys_metadata.get('X-Object-Transient-Sysmeta-Crypto-Meta')), + ]: + if meta is None: + continue + print('%s: %s' % ( + label, + json.dumps(load_crypto_meta(meta, b64decode=False), indent=2, + sort_keys=True, separators=(',', ': ')))) + + +def print_info(db_type, db_file, swift_dir='/etc/swift', stale_reads_ok=False, + drop_prefixes=False, verbose=False, sync=False): + if db_type not in ('account', 'container'): + print("Unrecognized DB type: internal error") + raise InfoSystemExit() + if not os.path.exists(db_file) or not db_file.endswith('.db'): + print("DB file doesn't exist") + raise InfoSystemExit() + if not db_file.startswith(('/', './')): + db_file = './' + db_file # don't break if the bare db file is given + if db_type == 'account': + broker = AccountBroker(db_file, stale_reads_ok=stale_reads_ok) + datadir = ABDATADIR + else: + broker = ContainerBroker(db_file, stale_reads_ok=stale_reads_ok) + datadir = CBDATADIR + try: + info = broker.get_info() + except sqlite3.OperationalError as err: + if 'no such table' in str(err): + print("Does not appear to be a DB of type \"%s\": %s" + % (db_type, db_file)) + raise InfoSystemExit() + raise + account = info['account'] + container = None + info['is_deleted'] = broker.is_deleted() + if db_type == 'container': + container = info['container'] + info['is_root'] = broker.is_root_container() + sranges = broker.get_shard_ranges() + if sranges: + info['shard_ranges'] = sranges + print_db_info_metadata( + db_type, info, broker.metadata, drop_prefixes, verbose) + if sync: + # Print incoming / outgoing sync tables. + for incoming in (True, False): + print_db_syncs(incoming, broker.get_syncs(incoming, + include_timestamp=True)) + try: + ring = Ring(swift_dir, ring_name=db_type) + except Exception: + ring = None + else: + print_ring_locations(ring, datadir, account, container) + + +def print_obj(datafile, check_etag=True, swift_dir='/etc/swift', + policy_name='', drop_prefixes=False): + """ + Display information about an object read from the datafile. + Optionally verify the datafile content matches the ETag metadata. + + :param datafile: path on disk to object file + :param check_etag: boolean, will read datafile content and verify + computed checksum matches value stored in + metadata. 
+ :param swift_dir: the path on disk to rings + :param policy_name: optionally the name to use when finding the ring + :param drop_prefixes: if True, strip "X-Object-Meta-", "X-Object-Sysmeta-", + and "X-Object-Transient-Sysmeta-" when displaying + User Metadata, System Metadata, and Transient + System Metadata entries + """ + if not os.path.exists(datafile): + print("Data file doesn't exist") + raise InfoSystemExit() + if not datafile.startswith(('/', './')): + datafile = './' + datafile + + policy_index = None + ring = None + datadir = DATADIR_BASE + + # try to extract policy index from datafile disk path + fullpath = os.path.abspath(datafile) + policy_index = int(extract_policy(fullpath) or POLICIES.legacy) + + try: + if policy_index: + datadir += '-' + str(policy_index) + ring = Ring(swift_dir, ring_name='object-' + str(policy_index)) + elif policy_index == 0: + ring = Ring(swift_dir, ring_name='object') + except IOError: + # no such ring + pass + + if policy_name: + policy = POLICIES.get_by_name(policy_name) + if policy: + policy_index_for_name = policy.idx + if (policy_index is not None and + policy_index_for_name is not None and + policy_index != policy_index_for_name): + print('WARNING: Ring does not match policy!') + print('Double check your policy name!') + if not ring and policy_index_for_name: + ring = POLICIES.get_object_ring(policy_index_for_name, + swift_dir) + datadir = get_data_dir(policy_index_for_name) + + with open(datafile, 'rb') as fp: + try: + metadata = read_metadata(fp) + except EOFError: + print("Invalid metadata") + raise InfoSystemExit() + metadata = {wsgi_to_str(k): v if k == 'name' else wsgi_to_str(v) + for k, v in metadata.items()} + + etag = metadata.pop('ETag', '') + length = metadata.pop('Content-Length', '') + path = metadata.get('name', '') + print_obj_metadata(metadata, drop_prefixes) + + # Optional integrity check; it's useful, but slow. + file_len = None + if check_etag: + h = md5(usedforsecurity=False) + file_len = 0 + while True: + data = fp.read(64 * 1024) + if not data: + break + h.update(data) + file_len += len(data) + h = h.hexdigest() + if etag: + if h == etag: + print('ETag: %s (valid)' % etag) + else: + print("ETag: %s doesn't match file hash of %s!" % + (etag, h)) + else: + print('ETag: Not found in metadata') + else: + print('ETag: %s (not checked)' % etag) + file_len = os.fstat(fp.fileno()).st_size + + if length: + if file_len == int(length): + print('Content-Length: %s (valid)' % length) + else: + print("Content-Length: %s doesn't match file length of %s" + % (length, file_len)) + else: + print('Content-Length: Not found in metadata') + + account, container, obj = path.split('/', 3)[1:] + if ring: + print_ring_locations(ring, datadir, account, container, obj, + policy_index=policy_index) + + +def print_item_locations(ring, ring_name=None, account=None, container=None, + obj=None, **kwargs): + """ + Display placement information for an item based on ring lookup. + + If a ring is provided it always takes precedence, but warnings will be + emitted if it doesn't match other optional arguments like the policy_name + or ring_name. + + If no ring is provided the ring_name and/or policy_name will be used to + lookup the ring. 
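+
+    For example, ``print_item_locations(None, account='AUTH_test',
+    container='c1')`` would load the container ring from ``swift_dir`` and
+    print the container DB placement for that account/container path (the
+    account and container names here are only illustrative).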
+ + :param ring: a ring instance + :param ring_name: server type, or storage policy ring name if object ring + :param account: account name + :param container: container name + :param obj: object name + :param partition: part number for non path lookups + :param policy_name: name of storage policy to use to lookup the ring + :param all_nodes: include all handoff nodes. If false, only the N primary + nodes and first N handoffs will be printed. + """ + + policy_name = kwargs.get('policy_name', None) + part = kwargs.get('partition', None) + all_nodes = kwargs.get('all', False) + swift_dir = kwargs.get('swift_dir', '/etc/swift') + + if ring and policy_name: + policy = POLICIES.get_by_name(policy_name) + if policy: + if ring_name != policy.ring_name: + print('WARNING: mismatch between ring and policy name!') + else: + print('WARNING: Policy %s is not valid' % policy_name) + + policy_index = None + if ring is None and (obj or part): + if not policy_name: + print('Need a ring or policy') + raise InfoSystemExit() + policy = POLICIES.get_by_name(policy_name) + if not policy: + print('No policy named %r' % policy_name) + raise InfoSystemExit() + policy_index = int(policy) + ring = POLICIES.get_object_ring(policy_index, swift_dir) + ring_name = (POLICIES.get_by_name(policy_name)).ring_name + + if (container or obj) and not account: + print('No account specified') + raise InfoSystemExit() + + if obj and not container: + print('No container specified') + raise InfoSystemExit() + + if not account and not part: + print('No target specified') + raise InfoSystemExit() + + loc = '' + if part and ring_name: + if '-' in ring_name and ring_name.startswith('object'): + loc = 'objects-' + ring_name.split('-', 1)[1] + else: + loc = ring_name + 's' + if account and container and obj: + loc = 'objects' + if '-' in ring_name and ring_name.startswith('object'): + policy_index = int(ring_name.rsplit('-', 1)[1]) + loc = 'objects-%d' % policy_index + if account and container and not obj: + loc = 'containers' + if not any([ring, ring_name]): + ring = Ring(swift_dir, ring_name='container') + else: + if ring_name != 'container': + print('WARNING: account/container specified ' + + 'but ring not named "container"') + if account and not container and not obj: + loc = 'accounts' + if not any([ring, ring_name]): + ring = Ring(swift_dir, ring_name='account') + else: + if ring_name != 'account': + print('WARNING: account specified ' + + 'but ring not named "account"') + + if account: + print('\nAccount \t%s' % urllib.parse.quote(account)) + if container: + print('Container\t%s' % urllib.parse.quote(container)) + if obj: + print('Object \t%s\n\n' % urllib.parse.quote(obj)) + print_ring_locations(ring, loc, account, container, obj, part, all_nodes, + policy_index=policy_index) + + +def obj_main(): + # Make stdout able to write escaped bytes + sys.stdout = codecs.getwriter("utf-8")( + sys.stdout.detach(), errors='surrogateescape') + + parser = OptionParser('%prog [options] OBJECT_FILE') + parser.add_option( + '-n', '--no-check-etag', default=True, + action="store_false", dest="check_etag", + help="Don't verify file contents against stored etag") + parser.add_option( + '-d', '--swift-dir', default='/etc/swift', dest='swift_dir', + help="Pass location of swift directory") + parser.add_option( + '--drop-prefixes', default=False, action="store_true", + help="When outputting metadata, drop the per-section common prefixes") + parser.add_option( + '-P', '--policy-name', dest='policy_name', + help="Specify storage policy name") + + options, 
args = parser.parse_args() + + if len(args) != 1: + sys.exit(parser.print_help()) + + if set_swift_dir(options.swift_dir): + reload_storage_policies() + + try: + print_obj(*args, **vars(options)) + except InfoSystemExit: + sys.exit(1) + + +def run_print_info(db_type, args, opts): + try: + print_info(db_type, *args, **opts) + except InfoSystemExit: + sys.exit(1) + except (sqlite3.OperationalError, LockTimeout) as e: + if not opts.get('stale_reads_ok'): + opts['stale_reads_ok'] = True + print('WARNING: Possibly Stale Data') + run_print_info(db_type, args, opts) + sys.exit(2) + else: + print('%s info failed: %s' % (db_type.title(), e)) + sys.exit(1) + + +def container_main(): + parser = OptionParser('%prog [options] CONTAINER_DB_FILE') + parser.add_option( + '-d', '--swift-dir', default='/etc/swift', + help="Pass location of swift directory") + parser.add_option( + '--drop-prefixes', default=False, action="store_true", + help="When outputting metadata, drop the per-section common prefixes") + parser.add_option( + '-v', '--verbose', default=False, action="store_true", + help="Show all shard ranges. By default, only the number of shard " + "ranges is displayed if there are many shards.") + parser.add_option( + '--sync', '-s', default=False, action="store_true", + help="Output the contents of the incoming/outging sync tables") + + options, args = parser.parse_args() + + if len(args) != 1: + sys.exit(parser.print_help()) + + run_print_info('container', args, vars(options)) + + +def account_main(): + parser = OptionParser('%prog [options] ACCOUNT_DB_FILE') + parser.add_option( + '-d', '--swift-dir', default='/etc/swift', + help="Pass location of swift directory") + parser.add_option( + '--drop-prefixes', default=False, action="store_true", + help="When outputting metadata, drop the per-section common prefixes") + parser.add_option( + '--sync', '-s', default=False, action="store_true", + help="Output the contents of the incoming/outging sync tables") + + options, args = parser.parse_args() + + if len(args) != 1: + sys.exit(parser.print_help()) + + run_print_info('account', args, vars(options)) diff --git a/swift/cli/manage_shard_ranges.py b/swift/cli/manage_shard_ranges.py new file mode 100644 index 0000000000..8bfe01a9ae --- /dev/null +++ b/swift/cli/manage_shard_ranges.py @@ -0,0 +1,1215 @@ +# Licensed under the Apache License, Version 2.0 (the "License"); you may not +# use this file except in compliance with the License. You may obtain a copy +# of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT +# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the +# License for the specific language governing permissions and limitations +# under the License. +""" +The ``swift-manage-shard-ranges`` tool provides commands for initiating +sharding of a container. ``swift-manage-shard-ranges`` operates directly on a +container database file. + +.. note:: + + ``swift-manage-shard-ranges`` must only be used on one replica of a + container database to avoid inconsistent results. The modifications made by + ``swift-manage-shard-ranges`` will be automatically copied to other + replicas of the container database via normal replication processes. + +There are three steps in the process of initiating sharding, each of which may +be performed in isolation or, as shown below, using a single command. + +#. 
The ``find`` sub-command scans the container database to identify how many + shard containers will be required and which objects they will manage. Each + shard container manages a range of the object namespace defined by a + ``lower`` and ``upper`` bound. The maximum number of objects to be allocated + to each shard container is specified on the command line. For example:: + + $ swift-manage-shard-ranges find 500000 + Loaded db broker for AUTH_test/c1. + [ + { + "index": 0, + "lower": "", + "object_count": 500000, + "upper": "o_01086834" + }, + { + "index": 1, + "lower": "o_01086834", + "object_count": 500000, + "upper": "o_01586834" + }, + { + "index": 2, + "lower": "o_01586834", + "object_count": 500000, + "upper": "o_02087570" + }, + { + "index": 3, + "lower": "o_02087570", + "object_count": 500000, + "upper": "o_02587572" + }, + { + "index": 4, + "lower": "o_02587572", + "object_count": 500000, + "upper": "o_03087572" + }, + { + "index": 5, + "lower": "o_03087572", + "object_count": 500000, + "upper": "o_03587572" + }, + { + "index": 6, + "lower": "o_03587572", + "object_count": 349194, + "upper": "" + } + ] + Found 7 ranges in 4.37222s (total object count 3349194) + + This command returns a list of shard ranges each of which describes the + namespace to be managed by a shard container. No other action is taken by + this command and the container database is unchanged. The output may be + redirected to a file for subsequent retrieval by the ``replace`` command. + For example:: + + $ swift-manage-shard-ranges find 500000 > my_shard_ranges + Loaded db broker for AUTH_test/c1. + Found 7 ranges in 2.448s (total object count 3349194) + +#. The ``replace`` sub-command deletes any shard ranges that might already be + in the container database and inserts shard ranges from a given file. The + file contents should be in the format generated by the ``find`` sub-command. + For example:: + + $ swift-manage-shard-ranges replace my_shard_ranges + Loaded db broker for AUTH_test/c1. + No shard ranges found to delete. + Injected 7 shard ranges. + Run container-replicator to replicate them to other nodes. + Use the enable sub-command to enable sharding. + + The container database is modified to store the shard ranges, but the + container will not start sharding until sharding is enabled. The ``info`` + sub-command may be used to inspect the state of the container database at + any point, and the ``show`` sub-command may be used to display the inserted + shard ranges. + + Shard ranges stored in the container database may be replaced using the + ``replace`` sub-command. This will first delete all existing shard ranges + before storing new shard ranges. Shard ranges may also be deleted from the + container database using the ``delete`` sub-command. + + Shard ranges should not be replaced or deleted using + ``swift-manage-shard-ranges`` once the next step of enabling sharding has + been taken. + +#. The ``enable`` sub-command enables the container for sharding. The sharder + daemon and/or container replicator daemon will replicate shard ranges to + other replicas of the container DB and the sharder daemon will proceed to + shard the container. This process may take some time depending on the size + of the container, the number of shard ranges and the underlying hardware. + + .. note:: + + Once the ``enable`` sub-command has been used there is no supported + mechanism to revert sharding. Do not use ``swift-manage-shard-ranges`` + to make any further changes to the shard ranges in the container DB. 
+ + For example:: + + $ swift-manage-shard-ranges enable + Loaded db broker for AUTH_test/c1. + Container moved to state 'sharding' with epoch 1525345093.22908. + Run container-sharder on all nodes to shard the container. + + This does not shard the container - sharding is performed by the + :ref:`sharder_daemon` - but sets the necessary state in the database for the + daemon to subsequently start the sharding process. + + The ``epoch`` value displayed in the output is the time at which sharding + was enabled. When the :ref:`sharder_daemon` starts sharding this container + it creates a new container database file using the epoch in the filename to + distinguish it from the retiring DB that is being sharded. + +All three steps may be performed with one sub-command:: + + $ swift-manage-shard-ranges find_and_replace 500000 --enable \ +--force + Loaded db broker for AUTH_test/c1. + No shard ranges found to delete. + Injected 7 shard ranges. + Run container-replicator to replicate them to other nodes. + Container moved to state 'sharding' with epoch 1525345669.46153. + Run container-sharder on all nodes to shard the container. + +""" +import argparse +import json +import os.path +import sys +import time +from contextlib import contextmanager + +from swift.common.utils import Timestamp, get_logger, ShardRange, readconf, \ + ShardRangeList, non_negative_int, config_positive_int_value +from swift.container.backend import ContainerBroker, UNSHARDED +from swift.container.sharder import make_shard_ranges, sharding_enabled, \ + CleavingContext, process_compactible_shard_sequences, \ + find_compactible_shard_sequences, find_overlapping_ranges, \ + find_paths, rank_paths, finalize_shrinking, DEFAULT_SHARDER_CONF, \ + ContainerSharderConf, find_paths_with_gaps, combine_shard_ranges, \ + update_own_shard_range_stats + +EXIT_SUCCESS = 0 +EXIT_ERROR = 1 +EXIT_INVALID_ARGS = 2 # consistent with argparse exit code for invalid args +EXIT_USER_QUIT = 3 + +MIN_SHARD_RANGE_AGE_FOR_REPAIR = 4 * 3600 + +# Some CLI options derive their default values from DEFAULT_SHARDER_CONF if +# they have not been set. It is therefore important that the CLI parser +# provides None as a default so that we can detect that no value was set on the +# command line. We use this alias to act as a reminder. +USE_SHARDER_DEFAULT = object() + + +class ManageShardRangesException(Exception): + pass + + +class GapsFoundException(ManageShardRangesException): + pass + + +class InvalidStateException(ManageShardRangesException): + pass + + +class InvalidSolutionException(ManageShardRangesException): + def __init__(self, msg, acceptor_path, overlapping_donors): + super(InvalidSolutionException, self).__init__(msg) + self.acceptor_path = acceptor_path + self.overlapping_donors = overlapping_donors + + +def wrap_for_argparse(func, msg=None): + """ + Wrap the given ``func`` to catch any ``ValueError`` and raise an + ``argparse.ArgumentTypeError`` instead. + + :param func: a function. + :param msg: an optional message to use with any exception that is used; if + not given then the string representation of the ValueError will be + used. + :return: a function wrapper. + """ + def wrapped_func(*args, **kwargs): + try: + return func(*args, **kwargs) + except ValueError as err: + raise argparse.ArgumentTypeError(str(err) if msg is None else msg) + return wrapped_func + + +def _proceed(args): + if args.dry_run: + choice = 'no' + elif args.yes: + choice = 'yes' + else: + try: + choice = input('Do you want to apply these changes to the ' + 'container DB? 
[yes/N]') + except (EOFError, KeyboardInterrupt): + choice = 'no' + if choice != 'yes': + print('No changes applied') + + return choice == 'yes' + + +def _print_shard_range(sr, level=0): + indent = ' ' * level + print(indent + '%r' % sr.name) + print(indent + ' objects: %9d, tombstones: %9d, lower: %r' + % (sr.object_count, sr.tombstones, sr.lower_str)) + print(indent + ' state: %9s, deleted: %d upper: %r' + % (sr.state_text, sr.deleted, sr.upper_str)) + + +@contextmanager +def _open_input(args): + if args.input == '-': + args.input = '' + yield sys.stdin + else: + with open(args.input, 'r') as fd: + yield fd + + +def _load_and_validate_shard_data(args, require_index=True): + required_keys = ['lower', 'upper', 'object_count'] + if require_index: + required_keys.append('index') + try: + with _open_input(args) as fd: + try: + data = json.load(fd) + if not isinstance(data, list): + raise ValueError('Shard data must be a list of dicts') + for k in required_keys: + for shard in data: + shard[k] # trigger KeyError for missing required key + return data + except (TypeError, ValueError, KeyError) as err: + print('Failed to load valid shard range data: %r' % err, + file=sys.stderr) + exit(2) + except IOError as err: + print('Failed to open file %s: %s' % (args.input, err), + file=sys.stderr) + exit(2) + + +def _check_shard_ranges(own_shard_range, shard_ranges): + reasons = [] + + def reason(x, y): + if x != y: + reasons.append('%s != %s' % (x, y)) + + if not shard_ranges: + reasons.append('No shard ranges.') + else: + reason(own_shard_range.lower, shard_ranges[0].lower) + reason(own_shard_range.upper, shard_ranges[-1].upper) + for x, y in zip(shard_ranges, shard_ranges[1:]): + reason(x.upper, y.lower) + + if reasons: + print('WARNING: invalid shard ranges: %s.' % reasons) + print('Aborting.') + exit(EXIT_ERROR) + + +def _check_own_shard_range(broker, args): + # TODO: this check is weak - if the shards prefix changes then we may not + # identify a shard container. The goal is to not inadvertently create an + # entire namespace default shard range for a shard container. + is_shard = broker.account.startswith(args.shards_account_prefix) + own_shard_range = broker.get_own_shard_range(no_default=is_shard) + if not own_shard_range: + print('WARNING: shard container missing own shard range.') + print('Aborting.') + exit(2) + return own_shard_range + + +def _find_ranges(broker, args, status_file=None): + start = last_report = time.time() + limit = 5 if status_file else -1 + shard_data, last_found = broker.find_shard_ranges( + args.rows_per_shard, limit=limit, + minimum_shard_size=args.minimum_shard_size) + if shard_data: + while not last_found: + if last_report + 10 < time.time(): + print('Found %d ranges in %gs; looking for more...' 
% ( + len(shard_data), time.time() - start), file=status_file) + last_report = time.time() + # prefix doesn't matter since we aren't persisting it + found_ranges = make_shard_ranges(broker, shard_data, '.shards_') + more_shard_data, last_found = broker.find_shard_ranges( + args.rows_per_shard, existing_ranges=found_ranges, limit=5, + minimum_shard_size=args.minimum_shard_size) + shard_data.extend(more_shard_data) + return shard_data, time.time() - start + + +def find_ranges(broker, args): + shard_data, delta_t = _find_ranges(broker, args, sys.stderr) + print(json.dumps(shard_data, sort_keys=True, indent=2)) + print('Found %d ranges in %gs (total object count %s)' % + (len(shard_data), delta_t, + sum(r['object_count'] for r in shard_data)), + file=sys.stderr) + return EXIT_SUCCESS + + +def show_shard_ranges(broker, args): + shard_ranges = broker.get_shard_ranges( + includes=getattr(args, 'includes', None), + include_deleted=getattr(args, 'include_deleted', False)) + shard_data = [dict(sr, state=sr.state_text) + for sr in shard_ranges] + + if not shard_data: + print("No shard data found.", file=sys.stderr) + elif getattr(args, 'brief', False): + print("Existing shard ranges:", file=sys.stderr) + print(json.dumps([(sd['lower'], sd['upper']) for sd in shard_data], + sort_keys=True, indent=2)) + else: + print("Existing shard ranges:", file=sys.stderr) + print(json.dumps(shard_data, sort_keys=True, indent=2)) + return EXIT_SUCCESS + + +def db_info(broker, args): + print('Sharding enabled = %s' % sharding_enabled(broker)) + own_sr = broker.get_own_shard_range(no_default=True) + print('Own shard range: %s' % + (json.dumps(dict(own_sr, state=own_sr.state_text), + sort_keys=True, indent=2) + if own_sr else None)) + db_state = broker.get_db_state() + print('db_state = %s' % db_state) + info = broker.get_info() + print('object_count = %d' % info['object_count']) + print('bytes_used = %d' % info['bytes_used']) + if db_state == 'sharding': + print('Retiring db id: %s' % broker.get_brokers()[0].get_info()['id']) + print('Cleaving context: %s' % + json.dumps(dict(CleavingContext.load(broker)), + sort_keys=True, indent=2)) + print('Metadata:') + for k, (v, t) in broker.metadata.items(): + print(' %s = %s' % (k, v)) + return EXIT_SUCCESS + + +def delete_shard_ranges(broker, args): + shard_ranges = broker.get_shard_ranges() + if not shard_ranges: + print("No shard ranges found to delete.") + return EXIT_SUCCESS + + while not args.force: + print('This will delete existing %d shard ranges.' % len(shard_ranges)) + if broker.get_db_state() != UNSHARDED: + print('WARNING: Be very cautious about deleting existing shard ' + 'ranges. Deleting all ranges in this db does not guarantee ' + 'deletion of all ranges on all replicas of the db.') + print(' - this db is in state %s' % broker.get_db_state()) + print(' - %d existing shard ranges have started sharding' % + [sr.state != ShardRange.FOUND + for sr in shard_ranges].count(True)) + try: + choice = input('Do you want to show the existing ranges [s], ' + 'delete the existing ranges [yes] ' + 'or quit without deleting [q]? ') + except (EOFError, KeyboardInterrupt): + choice = 'q' + + if choice == 's': + show_shard_ranges(broker, args) + continue + elif choice == 'q': + return EXIT_USER_QUIT + elif choice == 'yes': + break + else: + print('Please make a valid choice.') + print() + + now = Timestamp.now() + for sr in shard_ranges: + sr.deleted = 1 + sr.timestamp = now + broker.merge_shard_ranges(shard_ranges) + print('Deleted %s existing shard ranges.' 
% len(shard_ranges)) + return EXIT_SUCCESS + + +def merge_shard_ranges(broker, args): + _check_own_shard_range(broker, args) + shard_data = _load_and_validate_shard_data(args, require_index=False) + new_shard_ranges = ShardRangeList([ShardRange.from_dict(sr) + for sr in shard_data]) + new_shard_ranges.sort(key=ShardRange.sort_key) + + # do some checks before merging... + existing_shard_ranges = ShardRangeList( + broker.get_shard_ranges(include_deleted=True)) + outcome = combine_shard_ranges(new_shard_ranges, existing_shard_ranges) + if args.verbose: + print('This change will result in the following shard ranges in the ' + 'affected namespace:') + print(json.dumps([dict(sr) for sr in outcome], indent=2)) + overlaps = find_overlapping_ranges(outcome) + if overlaps: + print('WARNING: this change will result in shard ranges overlaps!') + paths_with_gaps = find_paths_with_gaps(outcome) + gaps = [gap for start_path, gap, end_path in paths_with_gaps + if existing_shard_ranges.includes(gap)] + if gaps: + print('WARNING: this change will result in shard ranges gaps!') + + if not _proceed(args): + return EXIT_USER_QUIT + + with broker.updated_timeout(args.replace_timeout): + broker.merge_shard_ranges(new_shard_ranges) + print('Injected %d shard ranges.' % len(new_shard_ranges)) + print('Run container-replicator to replicate them to other nodes.') + return EXIT_SUCCESS + + +def _replace_shard_ranges(broker, args, shard_data, timeout=0): + own_shard_range = _check_own_shard_range(broker, args) + shard_ranges = make_shard_ranges( + broker, shard_data, args.shards_account_prefix) + _check_shard_ranges(own_shard_range, shard_ranges) + + if args.verbose > 0: + print('New shard ranges to be injected:') + print(json.dumps([dict(sr) for sr in shard_ranges], + sort_keys=True, indent=2)) + + # Crank up the timeout in an effort to *make sure* this succeeds + with broker.updated_timeout(max(timeout, args.replace_timeout)): + delete_status = delete_shard_ranges(broker, args) + if delete_status != EXIT_SUCCESS: + return delete_status + broker.merge_shard_ranges(shard_ranges) + + print('Injected %d shard ranges.' % len(shard_ranges)) + print('Run container-replicator to replicate them to other nodes.') + if args.enable: + return enable_sharding(broker, args) + else: + print('Use the enable sub-command to enable sharding.') + return EXIT_SUCCESS + + +def replace_shard_ranges(broker, args): + shard_data = _load_and_validate_shard_data(args) + return _replace_shard_ranges(broker, args, shard_data) + + +def find_replace_shard_ranges(broker, args): + shard_data, delta_t = _find_ranges(broker, args, sys.stdout) + # Since we're trying to one-shot this, and the previous step probably + # took a while, make the timeout for writing *at least* that long + return _replace_shard_ranges(broker, args, shard_data, timeout=delta_t) + + +def _enable_sharding(broker, own_shard_range, args): + if own_shard_range.update_state(ShardRange.SHARDING): + own_shard_range.epoch = Timestamp.now() + own_shard_range.state_timestamp = own_shard_range.epoch + # initialise own_shard_range with current broker object stats... 
+ update_own_shard_range_stats(broker, own_shard_range) + + with broker.updated_timeout(args.enable_timeout): + broker.merge_shard_ranges([own_shard_range]) + broker.update_metadata({'X-Container-Sysmeta-Sharding': + ('True', Timestamp.now().normal)}) + return own_shard_range + + +def enable_sharding(broker, args): + own_shard_range = _check_own_shard_range(broker, args) + _check_shard_ranges(own_shard_range, broker.get_shard_ranges()) + + if own_shard_range.state == ShardRange.ACTIVE: + own_shard_range = _enable_sharding(broker, own_shard_range, args) + print('Container moved to state %r with epoch %s.' % + (own_shard_range.state_text, own_shard_range.epoch.internal)) + elif own_shard_range.state == ShardRange.SHARDING: + if own_shard_range.epoch: + print('Container already in state %r with epoch %s.' % + (own_shard_range.state_text, own_shard_range.epoch.internal)) + print('No action required.') + else: + print('Container already in state %r but missing epoch.' % + own_shard_range.state_text) + own_shard_range = _enable_sharding(broker, own_shard_range, args) + print('Container in state %r given epoch %s.' % + (own_shard_range.state_text, own_shard_range.epoch.internal)) + else: + print('WARNING: container in state %s (should be active or sharding).' + % own_shard_range.state_text) + print('Aborting.') + return EXIT_ERROR + + print('Run container-sharder on all nodes to shard the container.') + return EXIT_SUCCESS + + +def compact_shard_ranges(broker, args): + if not broker.is_root_container(): + print('WARNING: Shard containers cannot be compacted.') + print('This command should be used on a root container.') + return EXIT_ERROR + + if not broker.is_sharded(): + print('WARNING: Container is not yet sharded so cannot be compacted.') + return EXIT_ERROR + + shard_ranges = broker.get_shard_ranges() + if find_overlapping_ranges([sr for sr in shard_ranges if + sr.state != ShardRange.SHRINKING]): + print('WARNING: Container has overlapping shard ranges so cannot be ' + 'compacted.') + return EXIT_ERROR + + compactible = find_compactible_shard_sequences(broker, + args.shrink_threshold, + args.expansion_limit, + args.max_shrinking, + args.max_expanding) + if not compactible: + print('No shards identified for compaction.') + return EXIT_SUCCESS + + for sequence in compactible: + if sequence[-1].state not in (ShardRange.ACTIVE, ShardRange.SHARDED): + print('ERROR: acceptor not in correct state: %s' % sequence[-1], + file=sys.stderr) + return EXIT_ERROR + + for sequence in compactible: + acceptor = sequence[-1] + donors = sequence[:-1] + print('Donor shard range(s) with total of %d rows:' + % donors.row_count) + for donor in donors: + _print_shard_range(donor, level=1) + print('can be compacted into acceptor shard range:') + _print_shard_range(acceptor, level=1) + print('Total of %d shard sequences identified for compaction.' + % len(compactible)) + print('Once applied to the broker these changes will result in shard ' + 'range compaction the next time the sharder runs.') + + if not _proceed(args): + return EXIT_USER_QUIT + + process_compactible_shard_sequences(broker, compactible) + print('Updated %s shard sequences for compaction.' 
% len(compactible)) + print('Run container-replicator to replicate the changes to other ' + 'nodes.') + print('Run container-sharder on all nodes to compact shards.') + return EXIT_SUCCESS + + +def _remove_illegal_overlapping_donors( + acceptor_path, overlapping_donors, args): + # Check parent-children relationship in overlaps between acceptors and + # donors, remove any overlapping parent or child shard range from donors. + # Note: we can use set() here, since shard range object is hashed by + # id and all shard ranges in overlapping_donors are unique already. + parent_child_donors = set() + for acceptor in acceptor_path: + parent_child_donors.update( + [donor for donor in overlapping_donors + if acceptor.is_child_of(donor) or donor.is_child_of(acceptor)]) + if parent_child_donors: + overlapping_donors = ShardRangeList( + [sr for sr in overlapping_donors + if sr not in parent_child_donors]) + print('%d donor shards ignored due to parent-child relationship ' + 'checks' % len(parent_child_donors)) + + # Check minimum age requirement in overlaps between acceptors and donors. + if args.min_shard_age == 0: + return acceptor_path, overlapping_donors + ts_now = Timestamp.now() + # Remove overlapping donor shard ranges who were created recently within + # 'min_shard_age' age limit. + qualified_donors = ShardRangeList( + [sr for sr in overlapping_donors + if float(sr.timestamp) + args.min_shard_age < float(ts_now)]) + young_donors = len(overlapping_donors) - len(qualified_donors) + if young_donors > 0: + print('%d overlapping donor shards ignored due to minimum age ' + 'limit' % young_donors) + if not qualified_donors: + return acceptor_path, None + # Remove those overlapping donors whose overlapping acceptors were created + # within age limit. + donors_with_young_overlap_acceptor = set() + for acceptor_sr in acceptor_path: + if float(acceptor_sr.timestamp) + args.min_shard_age < float(ts_now): + continue + donors_with_young_overlap_acceptor.update( + [sr for sr in qualified_donors if acceptor_sr.overlaps(sr)]) + if donors_with_young_overlap_acceptor: + qualified_donors = ShardRangeList( + [sr for sr in qualified_donors + if sr not in donors_with_young_overlap_acceptor]) + print('%d donor shards ignored due to existence of overlapping young ' + 'acceptors' % len(donors_with_young_overlap_acceptor)) + + return acceptor_path, qualified_donors + + +def _find_overlapping_donors(shard_ranges, own_sr, args): + shard_ranges = ShardRangeList(shard_ranges) + if ShardRange.SHARDING in shard_ranges.states: + # This may be over-cautious, but for now we'll avoid dealing with + # SHARDING shards (which by design will temporarily overlap with their + # sub-shards) and require repair to be re-tried once sharding has + # completed. Note that once a shard ranges moves from SHARDING to + # SHARDED state and is deleted, some replicas of the shard may still be + # in the process of sharding but we cannot detect that at the root. + raise InvalidStateException('Found shard ranges in sharding state') + if ShardRange.SHRINKING in shard_ranges.states: + # Also stop now if there are SHRINKING shard ranges: we would need to + # ensure that these were not chosen as acceptors, but for now it is + # simpler to require repair to be re-tried once shrinking has + # completes. 
+ raise InvalidStateException('Found shard ranges in shrinking state') + + paths = find_paths(shard_ranges) + ranked_paths = rank_paths(paths, own_sr) + if not (ranked_paths and ranked_paths[0].includes(own_sr)): + # individual paths do not have gaps within them; if no path spans the + # entire namespace then there must be a gap in the shard_ranges + raise GapsFoundException + + # simple repair strategy: choose the highest ranked complete sequence and + # shrink all other shard ranges into it + acceptor_path = ranked_paths[0] + acceptor_names = set(sr.name for sr in acceptor_path) + overlapping_donors = ShardRangeList([sr for sr in shard_ranges + if sr.name not in acceptor_names]) + + # check that the solution makes sense: if the acceptor path has the most + # progressed continuous cleaving, which has reached cleaved_upper, then we + # don't expect any shard ranges beyond cleaved_upper to be in states + # CLEAVED or ACTIVE, otherwise there should have been a better acceptor + # path that reached them. + cleaved_states = {ShardRange.CLEAVED, ShardRange.ACTIVE} + cleaved_upper = acceptor_path.find_lower( + lambda sr: sr.state not in cleaved_states) + beyond_cleaved = acceptor_path.filter(marker=cleaved_upper) + if beyond_cleaved.states.intersection(cleaved_states): + raise InvalidSolutionException( + 'Isolated cleaved and/or active shard ranges in acceptor path', + acceptor_path, overlapping_donors) + beyond_cleaved = overlapping_donors.filter(marker=cleaved_upper) + if beyond_cleaved.states.intersection(cleaved_states): + raise InvalidSolutionException( + 'Isolated cleaved and/or active shard ranges in donor ranges', + acceptor_path, overlapping_donors) + + return _remove_illegal_overlapping_donors( + acceptor_path, overlapping_donors, args) + + +def _fix_gaps(broker, args, paths_with_gaps): + timestamp = Timestamp.now() + solutions = [] + print('Found %d gaps:' % len(paths_with_gaps)) + for start_path, gap_range, end_path in paths_with_gaps: + if end_path[0].state == ShardRange.ACTIVE: + expanding_range = end_path[0] + solutions.append((gap_range, expanding_range)) + elif start_path[-1].state == ShardRange.ACTIVE: + expanding_range = start_path[-1] + solutions.append((gap_range, expanding_range)) + else: + expanding_range = None + print(' gap: %r - %r' + % (gap_range.lower, gap_range.upper)) + print(' apparent gap contents:') + for sr in broker.get_shard_ranges(marker=gap_range.lower, + end_marker=gap_range.upper, + include_deleted=True): + _print_shard_range(sr, 3) + if expanding_range: + print(' gap can be fixed by expanding neighbor range:') + _print_shard_range(expanding_range, 3) + else: + print('WARNING: cannot fix gap: non-ACTIVE neighbors') + + if args.max_expanding >= 0: + solutions = solutions[:args.max_expanding] + + # it's possible that an expanding range is used twice, expanding both down + # and up; if so, we only want one copy of it in our merged shard ranges + expanding_ranges = {} + for gap_range, expanding_range in solutions: + expanding_range.expand([gap_range]) + expanding_range.timestamp = timestamp + expanding_ranges[expanding_range.name] = expanding_range + + print('') + print('Repairs necessary to fill gaps.') + print('The following expanded shard range(s) will be applied to the DB:') + for expanding_range in sorted(expanding_ranges.values(), + key=lambda s: s.lower): + _print_shard_range(expanding_range, 2) + print('') + print( + 'It is recommended that no other concurrent changes are made to the \n' + 'shard ranges while fixing gaps. 
If necessary, abort this change \n' + 'and stop any auto-sharding processes before repeating this command.' + ) + print('') + + if not _proceed(args): + return EXIT_USER_QUIT + + broker.merge_shard_ranges(list(expanding_ranges.values())) + print('Run container-replicator to replicate the changes to other nodes.') + print('Run container-sharder on all nodes to fill gaps.') + return EXIT_SUCCESS + + +def repair_gaps(broker, args): + shard_ranges = broker.get_shard_ranges() + paths_with_gaps = find_paths_with_gaps(shard_ranges) + if paths_with_gaps: + return _fix_gaps(broker, args, paths_with_gaps) + else: + print('Found one complete sequence of %d shard ranges with no gaps.' + % len(shard_ranges)) + print('No repairs necessary.') + return EXIT_SUCCESS + + +def print_repair_solution(acceptor_path, overlapping_donors): + print('Donors:') + for donor in sorted(overlapping_donors): + _print_shard_range(donor, level=1) + print('Acceptors:') + for acceptor in acceptor_path: + _print_shard_range(acceptor, level=1) + + +def find_repair_solution(shard_ranges, own_sr, args): + try: + acceptor_path, overlapping_donors = _find_overlapping_donors( + shard_ranges, own_sr, args) + except GapsFoundException: + print('Found no complete sequence of shard ranges.') + print('Repairs necessary to fill gaps.') + print('Gap filling not supported by this tool. No repairs performed.') + raise + except InvalidStateException as exc: + print('WARNING: %s' % exc) + print('No repairs performed.') + raise + except InvalidSolutionException as exc: + print('ERROR: %s' % exc) + print_repair_solution(exc.acceptor_path, exc.overlapping_donors) + print('No repairs performed.') + raise + + if not overlapping_donors: + print('Found one complete sequence of %d shard ranges and no ' + 'overlapping shard ranges.' % len(acceptor_path)) + print('No repairs necessary.') + return None, None + + print('Repairs necessary to remove overlapping shard ranges.') + print('Chosen a complete sequence of %d shard ranges with current total ' + 'of %d object records to accept object records from %d overlapping ' + 'donor shard ranges.' % + (len(acceptor_path), acceptor_path.object_count, + len(overlapping_donors))) + if args.verbose: + print_repair_solution(acceptor_path, overlapping_donors) + + print('Once applied to the broker these changes will result in:') + print(' %d shard ranges being removed.' % len(overlapping_donors)) + print(' %d object records being moved to the chosen shard ranges.' + % overlapping_donors.object_count) + + return acceptor_path, overlapping_donors + + +def repair_overlaps(broker, args): + shard_ranges = broker.get_shard_ranges() + if not shard_ranges: + print('No shards found, nothing to do.') + return EXIT_SUCCESS + + own_sr = broker.get_own_shard_range() + try: + acceptor_path, overlapping_donors = find_repair_solution( + shard_ranges, own_sr, args) + except ManageShardRangesException: + return EXIT_ERROR + + if not acceptor_path: + return EXIT_SUCCESS + + if not _proceed(args): + return EXIT_USER_QUIT + + # merge changes to the broker... + # note: acceptors do not need to be modified since they already span the + # complete range + ts_now = Timestamp.now() + finalize_shrinking(broker, [], overlapping_donors, ts_now) + print('Updated %s donor shard ranges.' 
% len(overlapping_donors)) + print('Run container-replicator to replicate the changes to other nodes.') + print('Run container-sharder on all nodes to repair shards.') + return EXIT_SUCCESS + + +def repair_shard_ranges(broker, args): + if not broker.is_root_container(): + print('WARNING: Shard containers cannot be repaired.') + print('This command should be used on a root container.') + return EXIT_ERROR + if args.gaps: + return repair_gaps(broker, args) + else: + return repair_overlaps(broker, args) + + +def analyze_shard_ranges(args): + shard_data = _load_and_validate_shard_data(args, require_index=False) + for data in shard_data: + # allow for incomplete shard range data that may have been scraped from + # swift-container-info output + data.setdefault('epoch', None) + shard_ranges = [ShardRange.from_dict(data) for data in shard_data] + whole_sr = ShardRange('whole/namespace', 0) + try: + find_repair_solution(shard_ranges, whole_sr, args) + except ManageShardRangesException: + return EXIT_ERROR + return EXIT_SUCCESS + + +def _add_find_args(parser): + parser.add_argument( + 'rows_per_shard', nargs='?', type=int, default=USE_SHARDER_DEFAULT, + help='Target number of rows for newly created shards. ' + 'Default is half of the shard_container_threshold value if that is ' + 'given in a conf file specified with --config, otherwise %s.' + % DEFAULT_SHARDER_CONF['rows_per_shard']) + parser.add_argument( + '--minimum-shard-size', + type=wrap_for_argparse(config_positive_int_value, 'must be > 0'), + default=USE_SHARDER_DEFAULT, + help='Minimum size of the final shard range. If this is greater than ' + 'one then the final shard range may be extended to more than ' + 'rows_per_shard in order to avoid a further shard range with less ' + 'than minimum-shard-size rows.') + + +def _add_account_prefix_arg(parser): + parser.add_argument( + '--shards_account_prefix', metavar='shards_account_prefix', type=str, + required=False, default='.shards_', + help="Prefix for shards account. The default is '.shards_'. This " + "should only be changed if the auto_create_account_prefix option " + "has been similarly changed in swift.conf.") + + +def _add_replace_args(parser): + _add_account_prefix_arg(parser) + parser.add_argument( + '--replace-timeout', type=int, default=600, + help='Minimum DB timeout to use when replacing shard ranges.') + parser.add_argument( + '--force', '-f', action='store_true', default=False, + help='Delete existing shard ranges; no questions asked.') + parser.add_argument( + '--enable', action='store_true', default=False, + help='Enable sharding after adding shard ranges.') + + +def _add_enable_args(parser): + parser.add_argument( + '--enable-timeout', type=int, default=300, + help='DB timeout to use when enabling sharding.') + + +def _add_prompt_args(parser): + group = parser.add_mutually_exclusive_group() + group.add_argument( + '--yes', '-y', action='store_true', default=False, + help='Apply shard range changes to broker without prompting. ' + 'Cannot be used with --dry-run option.') + group.add_argument( + '--dry-run', '-n', action='store_true', default=False, + help='Do not apply any shard range changes to broker. ' + 'Cannot be used with --yes option.') + + +def _add_skip_or_force_commits_arg(parser): + """ + We merge in the pending file by default, this is always correct and + useful for probe tests where shard containers have unrealistically low + numbers of objects, of which a significant proportion may still be in the + pending file. 
If you have 10GB databases with 100M objects you can use + --skip-commits and the selected shard ranges probably won't be that + different. The --force-commits option is redundant and may be deprecated. + """ + group = parser.add_mutually_exclusive_group() + group.add_argument( + '--skip-commits', action='store_true', dest='skip_commits', + default=False, + help='Skip commits for pending object updates. By default the broker' + ' will commit pending object updates.') + group.add_argument( + '--force-commits', action='store_false', dest='skip_commits', + default=argparse.SUPPRESS, help=argparse.SUPPRESS) + + +def _add_max_expanding_arg(parser): + parser.add_argument( + '--max-expanding', nargs='?', + type=wrap_for_argparse(config_positive_int_value, 'must be > 0'), + default=USE_SHARDER_DEFAULT, + help='Maximum number of shards that should be ' + 'expanded. Defaults to unlimited.') + + +def _make_parser(): + parser = argparse.ArgumentParser(description='Manage shard ranges') + parser.add_argument('path_to_file', + help='Path to a container DB file or, for the analyze ' + 'subcommand, a shard data file.') + parser.add_argument('--config', dest='conf_file', required=False, + help='Path to config file with [container-sharder] ' + 'section. The following subcommand options will ' + 'be loaded from a config file if they are not ' + 'given on the command line: ' + 'rows_per_shard, ' + 'max_shrinking, ' + 'max_expanding, ' + 'shrink_threshold, ' + 'expansion_limit') + parser.add_argument('--verbose', '-v', action='count', default=0, + help='Increase output verbosity') + _add_skip_or_force_commits_arg(parser) + + subparsers = parser.add_subparsers( + dest='subcommand', help='Sub-command help', title='Sub-commands') + + # find + find_parser = subparsers.add_parser( + 'find', help='Find and display shard ranges') + _add_find_args(find_parser) + find_parser.set_defaults(func=find_ranges) + + # delete + delete_parser = subparsers.add_parser( + 'delete', help='Delete all existing shard ranges from db') + delete_parser.add_argument( + '--force', '-f', action='store_true', default=False, + help='Delete existing shard ranges; no questions asked.') + delete_parser.set_defaults(func=delete_shard_ranges) + + # show + show_parser = subparsers.add_parser( + 'show', help='Print shard range data') + show_parser.add_argument( + '--include_deleted', '-d', action='store_true', default=False, + help='Include deleted shard ranges in output.') + show_parser.add_argument( + '--brief', '-b', action='store_true', default=False, + help='Show only shard range bounds in output.') + show_parser.add_argument('--includes', + help='limit shard ranges to include key') + show_parser.set_defaults(func=show_shard_ranges) + + # info + info_parser = subparsers.add_parser( + 'info', help='Print container db info') + info_parser.set_defaults(func=db_info) + + # merge + merge_parser = subparsers.add_parser( + 'merge', + help='Merge shard range(s) from file with existing shard ranges. This ' + 'subcommand should only be used if you are confident that you ' + 'know what you are doing. 
Shard ranges should not typically be ' + 'modified in this way.') + merge_parser.add_argument('input', metavar='input_file', + type=str, help='Name of file') + merge_parser.add_argument( + '--replace-timeout', type=int, default=600, + help='Minimum DB timeout to use when merging shard ranges.') + _add_account_prefix_arg(merge_parser) + _add_prompt_args(merge_parser) + merge_parser.set_defaults(func=merge_shard_ranges) + + # replace + replace_parser = subparsers.add_parser( + 'replace', + help='Replace existing shard ranges. User will be prompted before ' + 'deleting any existing shard ranges.') + replace_parser.add_argument('input', metavar='input_file', + type=str, help='Name of file') + _add_replace_args(replace_parser) + replace_parser.set_defaults(func=replace_shard_ranges) + + # find_and_replace + find_replace_parser = subparsers.add_parser( + 'find_and_replace', + help='Find new shard ranges and replace existing shard ranges. ' + 'User will be prompted before deleting any existing shard ranges.' + ) + _add_find_args(find_replace_parser) + _add_replace_args(find_replace_parser) + _add_enable_args(find_replace_parser) + find_replace_parser.set_defaults(func=find_replace_shard_ranges) + + # enable + enable_parser = subparsers.add_parser( + 'enable', help='Enable sharding and move db to sharding state.') + _add_enable_args(enable_parser) + enable_parser.set_defaults(func=enable_sharding) + _add_replace_args(enable_parser) + + # compact + compact_parser = subparsers.add_parser( + 'compact', + help='Compact shard ranges with less than the shrink-threshold number ' + 'of rows. This command only works on root containers.') + _add_prompt_args(compact_parser) + compact_parser.add_argument( + '--shrink-threshold', nargs='?', + type=wrap_for_argparse(config_positive_int_value, 'must be > 0'), + default=USE_SHARDER_DEFAULT, + help='The number of rows below which a shard can qualify for ' + 'shrinking. ' + 'Defaults to %d' % DEFAULT_SHARDER_CONF['shrink_threshold']) + compact_parser.add_argument( + '--expansion-limit', nargs='?', + type=wrap_for_argparse(config_positive_int_value, 'must be > 0'), + default=USE_SHARDER_DEFAULT, + help='Maximum number of rows for an expanding shard to have after ' + 'compaction has completed. ' + 'Defaults to %d' % DEFAULT_SHARDER_CONF['expansion_limit']) + # If just one donor shard is chosen to shrink to an acceptor then the + # expanded acceptor will handle object listings as soon as the donor shard + # has shrunk. If more than one donor shard are chosen to shrink to an + # acceptor then the acceptor may not handle object listings for some donor + # shards that have shrunk until *all* donors have shrunk, resulting in + # temporary gap(s) in object listings where the shrunk donors are missing. + compact_parser.add_argument( + '--max-shrinking', nargs='?', + type=wrap_for_argparse(config_positive_int_value, 'must be > 0'), + default=USE_SHARDER_DEFAULT, + help='Maximum number of shards that should be ' + 'shrunk into each expanding shard. ' + 'Defaults to 1. Using values greater ' + 'than 1 may result in temporary gaps in ' + 'object listings until all selected ' + 'shards have shrunk.') + _add_max_expanding_arg(compact_parser) + compact_parser.set_defaults(func=compact_shard_ranges) + + # repair + repair_parser = subparsers.add_parser( + 'repair', + help='Repair overlapping shard ranges. 
No action will be taken ' + 'without user confirmation unless the -y option is used.') + _add_prompt_args(repair_parser) + repair_parser.add_argument( + '--min-shard-age', nargs='?', + type=wrap_for_argparse(non_negative_int, 'must be >= 0'), + default=MIN_SHARD_RANGE_AGE_FOR_REPAIR, + help='Minimum age of a shard for it to be considered as an overlap ' + 'that is due for repair. Overlapping shards younger than this ' + 'age will be ignored. Value of 0 means no recent shards will be ' + 'ignored. Defaults to %d.' % MIN_SHARD_RANGE_AGE_FOR_REPAIR) + # TODO: maybe this should be a separate subcommand given that it needs + # some extra options vs repairing overlaps? + repair_parser.add_argument( + '--gaps', action='store_true', default=False, + help='Repair gaps in shard ranges.') + _add_max_expanding_arg(repair_parser) + repair_parser.set_defaults(func=repair_shard_ranges) + + # analyze + analyze_parser = subparsers.add_parser( + 'analyze', + help='Analyze shard range json data read from file. Use -v to see ' + 'more detailed analysis.') + analyze_parser.add_argument( + '--min-shard-age', nargs='?', + type=wrap_for_argparse(non_negative_int, 'must be >= 0'), + default=0, + help='Minimum age of a shard for it to be considered as an overlap ' + 'that is due for repair. Overlapping shards younger than this ' + 'age will be ignored. Value of 0 means no recent shards will be ' + 'ignored. Defaults to 0.') + analyze_parser.set_defaults(func=analyze_shard_ranges) + + return parser + + +def main(cli_args=None): + parser = _make_parser() + args = parser.parse_args(cli_args) + if not args.subcommand: + # On py2, subparsers are required; on py3 they are not; see + # https://bugs.python.org/issue9253. py37 added a `required` kwarg + # to let you control it, but prior to that, there was no choice in + # the matter. So, check whether the destination was set and bomb + # out if not. 
+ parser.print_help() + print('\nA sub-command is required.', file=sys.stderr) + return EXIT_INVALID_ARGS + + try: + conf = {} + if args.conf_file: + conf = readconf(args.conf_file, 'container-sharder') + conf.update(dict((k, v) for k, v in vars(args).items() + if v != USE_SHARDER_DEFAULT)) + conf_args = ContainerSharderConf(conf) + except (OSError, IOError) as exc: + print('Error opening config file %s: %s' % (args.conf_file, exc), + file=sys.stderr) + return EXIT_ERROR + except (TypeError, ValueError) as exc: + print('Error loading config: %s' % exc, file=sys.stderr) + return EXIT_INVALID_ARGS + + for k, v in vars(args).items(): + # set any un-set cli args from conf_args + if v is USE_SHARDER_DEFAULT: + setattr(args, k, getattr(conf_args, k)) + + try: + ContainerSharderConf.validate_conf(args) + except ValueError as err: + print('Invalid config: %s' % err, file=sys.stderr) + return EXIT_INVALID_ARGS + + if args.func in (analyze_shard_ranges,): + args.input = args.path_to_file + return args.func(args) or 0 + + logger = get_logger({}, name='ContainerBroker', log_to_console=True) + broker = ContainerBroker(os.path.realpath(args.path_to_file), + logger=logger, + skip_commits=args.skip_commits) + try: + broker.get_info() + except Exception as exc: + print('Error opening container DB %s: %s' % (args.path_to_file, exc), + file=sys.stderr) + return EXIT_ERROR + print('Loaded db broker for %s' % broker.path, file=sys.stderr) + return args.func(broker, args) + + +if __name__ == '__main__': + exit(main()) diff --git a/swift/cli/oldies.py b/swift/cli/oldies.py new file mode 100755 index 0000000000..7c6abe0bb2 --- /dev/null +++ b/swift/cli/oldies.py @@ -0,0 +1,93 @@ +#!/usr/bin/env python +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +import optparse +import subprocess +import sys + + +def main(): + parser = optparse.OptionParser(usage='''%prog [options] + +Lists old Swift processes. 
+ '''.strip()) + parser.add_option('-a', '--age', dest='hours', type='int', default=720, + help='look for processes at least HOURS old; ' + 'default: 720 (30 days)') + parser.add_option('-p', '--pids', action='store_true', + help='only print the pids found; for example, to pipe ' + 'to xargs kill') + (options, args) = parser.parse_args() + + listing = [] + for line in subprocess.Popen( + ['ps', '-eo', 'etime,pid,args', '--no-headers'], + stdout=subprocess.PIPE).communicate()[0].split(b'\n'): + if not line: + continue + hours = 0 + try: + etime, pid, args = line.decode('ascii').split(None, 2) + except ValueError: + # This covers both decoding and not-enough-values-to-unpack errors + sys.exit('Could not process ps line %r' % line) + if not args.startswith(( + '/usr/bin/python /usr/bin/swift-', + '/usr/bin/python /usr/local/bin/swift-', + '/bin/python /usr/bin/swift-', + '/usr/bin/python3 /usr/bin/swift-', + '/usr/bin/python3 /usr/local/bin/swift-', + '/bin/python3 /usr/bin/swift-')): + continue + args = args.split('-', 1)[1] + etime = etime.split('-') + if len(etime) == 2: + hours = int(etime[0]) * 24 + etime = etime[1] + elif len(etime) == 1: + etime = etime[0] + else: + sys.exit('Could not process etime value from %r' % line) + etime = etime.split(':') + if len(etime) == 3: + hours += int(etime[0]) + elif len(etime) != 2: + sys.exit('Could not process etime value from %r' % line) + if hours >= options.hours: + listing.append((str(hours), pid, args)) + + if not listing: + sys.exit() + + if options.pids: + for hours, pid, args in listing: + print(pid) + else: + hours_len = len('Hours') + pid_len = len('PID') + args_len = len('Command') + for hours, pid, args in listing: + hours_len = max(hours_len, len(hours)) + pid_len = max(pid_len, len(pid)) + args_len = max(args_len, len(args)) + args_len = min(args_len, 78 - hours_len - pid_len) + + print('%*s %*s %s' % (hours_len, 'Hours', pid_len, 'PID', 'Command')) + for hours, pid, args in listing: + print('%*s %*s %s' % (hours_len, hours, pid_len, + pid, args[:args_len])) + + +if __name__ == '__main__': + main() diff --git a/bin/swift-orphans b/swift/cli/orphans.py similarity index 64% rename from bin/swift-orphans rename to swift/cli/orphans.py index 3eb799c0e5..d957afd7d4 100755 --- a/bin/swift-orphans +++ b/swift/cli/orphans.py @@ -1,13 +1,28 @@ #!/usr/bin/env python +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. import optparse import os +import re import signal import subprocess import sys +from swift.common.manager import RUN_DIR -if __name__ == '__main__': + +def main(): parser = optparse.OptionParser(usage='''%prog [options] Lists and optionally kills orphaned Swift processes. 
This is done by scanning @@ -28,36 +43,44 @@ parser.add_option('-w', '--wide', dest='wide', default=False, action='store_true', help="don't clip the listing at 80 characters") + parser.add_option('-r', '--run-dir', type="str", + dest="run_dir", default=RUN_DIR, + help="alternative directory to store running pid files " + "default: %s" % RUN_DIR) (options, args) = parser.parse_args() pids = [] - for root, directories, files in os.walk('/var/run/swift'): + + for root, directories, files in os.walk(options.run_dir): for name in files: - if name.endswith('.pid'): + if name.endswith(('.pid', '.pid.d')): pids.append(open(os.path.join(root, name)).read().strip()) pids.extend(subprocess.Popen( ['ps', '--ppid', pids[-1], '-o', 'pid', '--no-headers'], - stdout=subprocess.PIPE).communicate()[0].split()) + stdout=subprocess.PIPE).communicate()[0].decode().split()) listing = [] + swift_cmd_re = re.compile( + '^/usr/bin/python[23]? /usr(?:/local)?/bin/swift-') for line in subprocess.Popen( ['ps', '-eo', 'etime,pid,args', '--no-headers'], - stdout=subprocess.PIPE).communicate()[0].split('\n'): + stdout=subprocess.PIPE).communicate()[0].split(b'\n'): if not line: continue hours = 0 try: - etime, pid, args = line.split(None, 2) + etime, pid, args = line.decode('ascii').split(None, 2) except ValueError: sys.exit('Could not process ps line %r' % line) if pid in pids: continue - if (not args.startswith('/usr/bin/python /usr/bin/swift-') and - not args.startswith('/usr/bin/python /usr/local/bin/swift-')) or \ - 'swift-orphans' in args or \ - 'once' in args.split(): + if any([ + not swift_cmd_re.match(args), + 'swift-orphans' in args, + 'once' in args.split(), + ]): continue - args = args.split('-', 1)[1] + args = args.split('swift-', 1)[1] etime = etime.split('-') if len(etime) == 2: hours = int(etime[0]) * 24 @@ -75,7 +98,7 @@ listing.append((str(hours), pid, args)) if not listing: - exit() + sys.exit() hours_len = len('Hours') pid_len = len('PID') @@ -86,11 +109,11 @@ args_len = max(args_len, len(args)) args_len = min(args_len, 78 - hours_len - pid_len) - print ('%%%ds %%%ds %%s' % (hours_len, pid_len)) % \ - ('Hours', 'PID', 'Command') + print('%*s %*s %s' % + (hours_len, 'Hours', pid_len, 'PID', 'Command')) for hours, pid, args in listing: - print ('%%%ds %%%ds %%s' % (hours_len, pid_len)) % \ - (hours, pid, args[:args_len]) + print('%*s %*s %s' % + (hours_len, hours, pid_len, pid, args[:args_len])) if options.signal: try: @@ -102,7 +125,12 @@ if not signum: sys.exit('Could not translate %r to a signal number.' % options.signal) - print 'Sending processes %s (%d) signal...' % (options.signal, signum), + print('Sending processes %s (%d) signal...' % (options.signal, signum), + end='') for hours, pid, args in listing: os.kill(int(pid), signum) - print 'Done.' + print('Done.') + + +if __name__ == '__main__': + main() diff --git a/swift/cli/recon.py b/swift/cli/recon.py new file mode 100644 index 0000000000..d693be287a --- /dev/null +++ b/swift/cli/recon.py @@ -0,0 +1,1295 @@ +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. 
+# See the License for the specific language governing permissions and +# limitations under the License. + +""" + cmdline utility to perform cluster reconnaissance +""" + + +from eventlet.green import socket +from urllib.parse import urlparse + +from swift.common.utils import ( + SWIFT_CONF_FILE, md5_hash_for_file, set_swift_dir) +from swift.common.ring import Ring +from swift.common.storage_policy import POLICIES, reload_storage_policies +import eventlet +import json +import optparse +import time +import sys +import os + +from eventlet.green.urllib import request as urllib_request + + +def seconds2timeunit(seconds): + elapsed = seconds + unit = 'seconds' + if elapsed >= 60: + elapsed = elapsed / 60.0 + unit = 'minutes' + if elapsed >= 60: + elapsed = elapsed / 60.0 + unit = 'hours' + if elapsed >= 24: + elapsed = elapsed / 24.0 + unit = 'days' + return elapsed, unit + + +def size_suffix(size): + suffixes = ['bytes', 'kB', 'MB', 'GB', 'TB', 'PB', 'EB', 'ZB', 'YB'] + for suffix in suffixes: + if size < 1000: + return "%s %s" % (size, suffix) + size = size // 1000 + return "%s %s" % (size, suffix) + + +class Scout(object): + """ + Obtain swift recon information + """ + + def __init__(self, recon_type, verbose=False, suppress_errors=False, + timeout=5): + self.recon_type = recon_type + self.verbose = verbose + self.suppress_errors = suppress_errors + self.timeout = timeout + + def scout_host(self, base_url, recon_type): + """ + Perform the actual HTTP request to obtain swift recon telemetry. + + :param base_url: the base url of the host you wish to check. str of the + format 'http://127.0.0.1:6200/recon/' + :param recon_type: the swift recon check to request. + :returns: tuple of (recon url used, response body, and status) + """ + url = base_url + recon_type + try: + body = urllib_request.urlopen(url, timeout=self.timeout).read() + if isinstance(body, bytes): + body = body.decode('utf8') + content = json.loads(body) + if self.verbose: + print("-> %s: %s" % (url, content)) + status = 200 + except urllib_request.HTTPError as err: + if not self.suppress_errors or self.verbose: + print("-> %s: %s" % (url, err)) + content = err + status = err.code + except (urllib_request.URLError, socket.timeout) as err: + if not self.suppress_errors or self.verbose: + print("-> %s: %s" % (url, err)) + content = err + status = -1 + return url, content, status + + def scout(self, host): + """ + Obtain telemetry from a host running the swift recon middleware. + + :param host: host to check + :returns: tuple of (recon url used, response body, status, time start + and time end) + """ + base_url = "http://%s:%s/recon/" % (host[0], host[1]) + ts_start = time.time() + url, content, status = self.scout_host(base_url, self.recon_type) + ts_end = time.time() + return url, content, status, ts_start, ts_end + + def scout_server_type(self, host): + """ + Obtain Server header by calling OPTIONS. 
+ + :param host: host to check + :returns: Server type, status + """ + try: + url = "http://%s:%s/" % (host[0], host[1]) + req = urllib_request.Request(url) + req.get_method = lambda: 'OPTIONS' + conn = urllib_request.urlopen(req) + header = conn.info().get('Server') + server_header = header.split('/') + content = server_header[0] + status = 200 + except urllib_request.HTTPError as err: + if not self.suppress_errors or self.verbose: + print("-> %s: %s" % (url, err)) + content = err + status = err.code + except (urllib_request.URLError, socket.timeout) as err: + if not self.suppress_errors or self.verbose: + print("-> %s: %s" % (url, err)) + content = err + status = -1 + return url, content, status + + +class SwiftRecon(object): + """ + Retrieve and report cluster info from hosts running recon middleware. + """ + + def __init__(self): + self.verbose = False + self.suppress_errors = False + self.timeout = 5 + self.pool_size = 30 + self.pool = eventlet.GreenPool(self.pool_size) + self.check_types = ['account', 'container', 'object'] + self.server_type = 'object' + + def _gen_stats(self, stats, name=None): + """Compute various stats from a list of values.""" + cstats = [x for x in stats if x is not None] + if len(cstats) > 0: + ret_dict = {'low': min(cstats), 'high': max(cstats), + 'total': sum(cstats), 'reported': len(cstats), + 'number_none': len(stats) - len(cstats), 'name': name} + ret_dict['average'] = ret_dict['total'] / float(len(cstats)) + ret_dict['perc_none'] = \ + ret_dict['number_none'] * 100.0 / len(stats) + else: + ret_dict = {'reported': 0} + return ret_dict + + def _print_stats(self, stats): + """ + print out formatted stats to console + + :param stats: dict of stats generated by _gen_stats + """ + print('[%(name)s] low: %(low)d, high: %(high)d, avg: ' + '%(average).1f, total: %(total)d, ' + 'Failed: %(perc_none).1f%%, no_result: %(number_none)d, ' + 'reported: %(reported)d' % stats) + + def _ptime(self, timev=None): + """ + :param timev: a unix timestamp or None + :returns: a pretty string of the current time or provided time in UTC + """ + if timev: + return time.strftime("%Y-%m-%d %H:%M:%S", time.gmtime(timev)) + else: + return time.strftime("%Y-%m-%d %H:%M:%S", time.gmtime()) + + def get_hosts(self, region_filter, zone_filter, swift_dir, ring_names): + """ + Get a list of hosts in the rings. + + :param region_filter: Only list regions matching given filter + :param zone_filter: Only list zones matching given filter + :param swift_dir: Directory of swift config, usually /etc/swift + :param ring_names: Collection of ring names, such as + ['object', 'object-2'] + :returns: a set of tuples containing the ip and port of hosts + """ + rings = [Ring(swift_dir, ring_name=n) for n in ring_names] + devs = [d for r in rings for d in r.devs if d] + if region_filter is not None: + devs = [d for d in devs if d['region'] == region_filter] + if zone_filter is not None: + devs = [d for d in devs if d['zone'] == zone_filter] + return set((d['ip'], d['port']) for d in devs) + + def get_ringmd5(self, hosts, swift_dir): + """ + Compare ring md5sum's with those on remote host + + :param hosts: set of hosts to check. in the format of: + set([('127.0.0.1', 6220), ('127.0.0.2', 6230)]) + :param swift_dir: The local directory with the ring files. 
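+
+ Illustrative example (a sketch, not part of the original change):
+ with server_type 'object' and a swift_dir holding object.ring.gz and
+ object-1.ring.gz, the local md5 of both ring files is compared against
+ each host's /recon/ringmd5 response.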
+ """ + matches = 0 + errors = 0 + ring_names = set() + if self.server_type == 'object': + for ring_name in os.listdir(swift_dir): + if ring_name.startswith('object') and \ + ring_name.endswith('.ring.gz'): + ring_names.add(ring_name) + else: + ring_name = '%s.ring.gz' % self.server_type + ring_names.add(ring_name) + rings = {} + for ring_name in ring_names: + rings[ring_name] = md5_hash_for_file( + os.path.join(swift_dir, ring_name)) + recon = Scout("ringmd5", self.verbose, self.suppress_errors, + self.timeout) + print("[%s] Checking ring md5sums" % self._ptime()) + if self.verbose: + for ring_file, ring_sum in rings.items(): + print("-> On disk %s md5sum: %s" % (ring_file, ring_sum)) + for url, response, status, ts_start, ts_end in self.pool.imap( + recon.scout, hosts): + if status != 200: + errors = errors + 1 + continue + success = True + for remote_ring_file, remote_ring_sum in response.items(): + remote_ring_name = os.path.basename(remote_ring_file) + if not remote_ring_name.startswith(self.server_type): + continue + ring_sum = rings.get(remote_ring_name, None) + if remote_ring_sum != ring_sum: + success = False + print("!! %s (%s => %s) doesn't match on disk md5sum" % ( + url, remote_ring_name, remote_ring_sum)) + if not success: + errors += 1 + continue + matches += 1 + if self.verbose: + print("-> %s matches." % url) + print("%s/%s hosts matched, %s error[s] while checking hosts." % ( + matches, len(hosts), errors)) + print("=" * 79) + + def get_swiftconfmd5(self, hosts, printfn=print): + """ + Compare swift.conf md5sum with that on remote hosts + + :param hosts: set of hosts to check. in the format of: + set([('127.0.0.1', 6220), ('127.0.0.2', 6230)]) + :param printfn: function to print text; defaults to print() + """ + matches = 0 + errors = 0 + conf_sum = md5_hash_for_file(SWIFT_CONF_FILE) + recon = Scout("swiftconfmd5", self.verbose, self.suppress_errors, + self.timeout) + printfn("[%s] Checking swift.conf md5sum" % self._ptime()) + if self.verbose: + printfn("-> On disk swift.conf md5sum: %s" % (conf_sum,)) + for url, response, status, ts_start, ts_end in self.pool.imap( + recon.scout, hosts): + if status == 200: + if response[SWIFT_CONF_FILE] != conf_sum: + printfn("!! %s (%s) doesn't match on disk md5sum" % + (url, response[SWIFT_CONF_FILE])) + else: + matches = matches + 1 + if self.verbose: + printfn("-> %s matches." % url) + else: + errors = errors + 1 + printfn("%s/%s hosts matched, %s error[s] while checking hosts." + % (matches, len(hosts), errors)) + printfn("=" * 79) + + def async_check(self, hosts): + """ + Obtain and print async pending statistics + + :param hosts: set of hosts to check. in the format of: + set([('127.0.0.1', 6220), ('127.0.0.2', 6230)]) + """ + scan = {} + recon = Scout("async", self.verbose, self.suppress_errors, + self.timeout) + print("[%s] Checking async pendings" % self._ptime()) + for url, response, status, ts_start, ts_end in self.pool.imap( + recon.scout, hosts): + if status == 200: + scan[url] = response['async_pending'] + stats = self._gen_stats(scan.values(), 'async_pending') + if stats['reported'] > 0: + self._print_stats(stats) + else: + print("[async_pending] - No hosts returned valid data.") + print("=" * 79) + + def driveaudit_check(self, hosts): + """ + Obtain and print drive audit error statistics + + :param hosts: set of hosts to check. 
in the format of: + set([('127.0.0.1', 6220), ('127.0.0.2', 6230)] + """ + scan = {} + recon = Scout("driveaudit", self.verbose, self.suppress_errors, + self.timeout) + print("[%s] Checking drive-audit errors" % self._ptime()) + for url, response, status, ts_start, ts_end in self.pool.imap( + recon.scout, hosts): + if status == 200: + scan[url] = response['drive_audit_errors'] + stats = self._gen_stats(scan.values(), 'drive_audit_errors') + if stats['reported'] > 0: + self._print_stats(stats) + else: + print("[drive_audit_errors] - No hosts returned valid data.") + print("=" * 79) + + def umount_check(self, hosts): + """ + Check for and print unmounted drives + + :param hosts: set of hosts to check. in the format of: + set([('127.0.0.1', 6220), ('127.0.0.2', 6230)]) + """ + unmounted = {} + errors = {} + recon = Scout("unmounted", self.verbose, self.suppress_errors, + self.timeout) + print("[%s] Getting unmounted drives from %s hosts..." % + (self._ptime(), len(hosts))) + for url, response, status, ts_start, ts_end in self.pool.imap( + recon.scout, hosts): + if status == 200: + unmounted[url] = [] + errors[url] = [] + for i in response: + if not isinstance(i['mounted'], bool): + errors[url].append(i['device']) + else: + unmounted[url].append(i['device']) + for host in unmounted: + node = urlparse(host).netloc + for entry in unmounted[host]: + print("Not mounted: %s on %s" % (entry, node)) + for host in errors: + node = urlparse(host).netloc + for entry in errors[host]: + print("Device errors: %s on %s" % (entry, node)) + print("=" * 79) + + def server_type_check(self, hosts): + """ + Check for server types on the ring + + :param hosts: set of hosts to check. in the format of: + set([('127.0.0.1', 6220), ('127.0.0.2', 6230)]) + """ + errors = {} + recon = Scout("server_type_check", self.verbose, self.suppress_errors, + self.timeout) + print("[%s] Validating server type '%s' on %s hosts..." % + (self._ptime(), self.server_type, len(hosts))) + for url, response, status in self.pool.imap( + recon.scout_server_type, hosts): + if status == 200: + if response != self.server_type + '-server': + errors[url] = response + print("%s/%s hosts ok, %s error[s] while checking hosts." % ( + len(hosts) - len(errors), len(hosts), len(errors))) + for host in errors: + print("Invalid: %s is %s" % (host, errors[host])) + print("=" * 79) + + def expirer_check(self, hosts): + """ + Obtain and print expirer statistics + + :param hosts: set of hosts to check. in the format of: + set([('127.0.0.1', 6220), ('127.0.0.2', 6230)]) + """ + stats = {'object_expiration_pass': [], 'expired_last_pass': []} + recon = Scout("expirer/%s" % self.server_type, self.verbose, + self.suppress_errors, self.timeout) + print("[%s] Checking on expirers" % self._ptime()) + for url, response, status, ts_start, ts_end in self.pool.imap( + recon.scout, hosts): + if status == 200: + stats['object_expiration_pass'].append( + response.get('object_expiration_pass')) + stats['expired_last_pass'].append( + response.get('expired_last_pass')) + for k in stats: + if stats[k]: + computed = self._gen_stats(stats[k], name=k) + if computed['reported'] > 0: + self._print_stats(computed) + else: + print("[%s] - No hosts returned valid data." % k) + else: + print("[%s] - No hosts returned valid data." % k) + print("=" * 79) + + def _calculate_least_and_most_recent(self, url_time_data): + """calulate and print the least and most recent urls + + Given a list of url and time tuples calulate the most and least + recent timings and print it out. 
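+
+ Illustrative example (a sketch, not part of the original change): given
+ [('http://h1:6200/recon/replication/object', 100.0),
+ ('http://h2:6200/recon/replication/object', 200.0)], the oldest
+ completion is attributed to h1:6200 and the most recent to h2:6200.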
+ :param url_time_data: list of url and time tuples: [(url, time_), ..] + """ + least_recent_time = 9999999999 + least_recent_url = None + most_recent_time = 0 + most_recent_url = None + + for url, last in url_time_data: + if last is None: + continue + if last < least_recent_time: + least_recent_time = last + least_recent_url = url + if last > most_recent_time: + most_recent_time = last + most_recent_url = url + + if least_recent_url is not None: + host = urlparse(least_recent_url).netloc + if not least_recent_time: + print('Oldest completion was NEVER by %s.' % host) + else: + elapsed = time.time() - least_recent_time + elapsed, elapsed_unit = seconds2timeunit(elapsed) + print('Oldest completion was %s (%d %s ago) by %s.' % ( + self._ptime(least_recent_time), + elapsed, elapsed_unit, host)) + if most_recent_url is not None: + host = urlparse(most_recent_url).netloc + elapsed = time.time() - most_recent_time + elapsed, elapsed_unit = seconds2timeunit(elapsed) + print('Most recent completion was %s (%d %s ago) by %s.' % ( + self._ptime(most_recent_time), + elapsed, elapsed_unit, host)) + + def reconstruction_check(self, hosts): + """ + Obtain and print reconstructon statistics + + :param hosts: set of hosts to check. in the format of: + set([('127.0.0.1', 6020), ('127.0.0.2', 6030)]) + """ + stats = [] + last_stats = [] + recon = Scout("reconstruction/%s" % self.server_type, self.verbose, + self.suppress_errors, self.timeout) + print("[%s] Checking on reconstructors" % self._ptime()) + for url, response, status, ts_start, ts_end in self.pool.imap( + recon.scout, hosts): + if status == 200: + stats.append(response.get('object_reconstruction_time')) + last = response.get('object_reconstruction_last', 0) + last_stats.append((url, last)) + if stats: + computed = self._gen_stats(stats, + name='object_reconstruction_time') + if computed['reported'] > 0: + self._print_stats(computed) + else: + print("[object_reconstruction_time] - No hosts returned " + "valid data.") + else: + print("[object_reconstruction_time] - No hosts returned " + "valid data.") + self._calculate_least_and_most_recent(last_stats) + print("=" * 79) + + def replication_check(self, hosts): + """ + Obtain and print replication statistics + + :param hosts: set of hosts to check. in the format of: + set([('127.0.0.1', 6220), ('127.0.0.2', 6230)]) + """ + stats = {'replication_time': [], 'failure': [], 'success': [], + 'attempted': []} + last_stats = [] + recon = Scout("replication/%s" % self.server_type, self.verbose, + self.suppress_errors, self.timeout) + print("[%s] Checking on replication" % self._ptime()) + for url, response, status, ts_start, ts_end in self.pool.imap( + recon.scout, hosts): + if status == 200: + stats['replication_time'].append( + response.get('replication_time', + response.get('object_replication_time', 0))) + repl_stats = response.get('replication_stats') + if repl_stats: + for stat_key in ['attempted', 'failure', 'success']: + stats[stat_key].append(repl_stats.get(stat_key)) + last = response.get('replication_last', + response.get('object_replication_last', 0)) + last_stats.append((url, last)) + for k in stats: + if stats[k]: + if k != 'replication_time': + computed = self._gen_stats(stats[k], + name='replication_%s' % k) + else: + computed = self._gen_stats(stats[k], name=k) + if computed['reported'] > 0: + self._print_stats(computed) + else: + print("[%s] - No hosts returned valid data." % k) + else: + print("[%s] - No hosts returned valid data." 
% k) + self._calculate_least_and_most_recent(last_stats) + print("=" * 79) + + def updater_check(self, hosts): + """ + Obtain and print updater statistics + + :param hosts: set of hosts to check. in the format of: + set([('127.0.0.1', 6220), ('127.0.0.2', 6230)]) + """ + stats = [] + recon = Scout("updater/%s" % self.server_type, self.verbose, + self.suppress_errors, self.timeout) + print("[%s] Checking updater times" % self._ptime()) + for url, response, status, ts_start, ts_end in self.pool.imap( + recon.scout, hosts): + if status == 200: + if response['%s_updater_sweep' % self.server_type]: + stats.append(response['%s_updater_sweep' % + self.server_type]) + if len(stats) > 0: + computed = self._gen_stats(stats, name='updater_last_sweep') + if computed['reported'] > 0: + self._print_stats(computed) + else: + print("[updater_last_sweep] - No hosts returned valid data.") + else: + print("[updater_last_sweep] - No hosts returned valid data.") + print("=" * 79) + + def auditor_check(self, hosts): + """ + Obtain and print obj auditor statistics + + :param hosts: set of hosts to check. in the format of: + set([('127.0.0.1', 6220), ('127.0.0.2', 6230)]) + """ + scan = {} + adone = '%s_auditor_pass_completed' % self.server_type + afail = '%s_audits_failed' % self.server_type + apass = '%s_audits_passed' % self.server_type + asince = '%s_audits_since' % self.server_type + recon = Scout("auditor/%s" % self.server_type, self.verbose, + self.suppress_errors, self.timeout) + print("[%s] Checking auditor stats" % self._ptime()) + for url, response, status, ts_start, ts_end in self.pool.imap( + recon.scout, hosts): + if status == 200: + scan[url] = response + if len(scan) < 1: + print("Error: No hosts available") + return + stats = {} + stats[adone] = [scan[i][adone] for i in scan + if scan[i][adone] is not None] + stats[afail] = [scan[i][afail] for i in scan + if scan[i][afail] is not None] + stats[apass] = [scan[i][apass] for i in scan + if scan[i][apass] is not None] + stats[asince] = [scan[i][asince] for i in scan + if scan[i][asince] is not None] + for k in stats: + if len(stats[k]) < 1: + print("[%s] - No hosts returned valid data." % k) + else: + if k != asince: + computed = self._gen_stats(stats[k], k) + if computed['reported'] > 0: + self._print_stats(computed) + if len(stats[asince]) >= 1: + low = min(stats[asince]) + high = max(stats[asince]) + total = sum(stats[asince]) + average = total / len(stats[asince]) + print('[last_pass] oldest: %s, newest: %s, avg: %s' % + (self._ptime(low), self._ptime(high), self._ptime(average))) + print("=" * 79) + + def nested_get_value(self, key, recon_entry): + """ + Generator that yields all values for given key in a recon cache entry. + This is for use with object auditor recon cache entries. If the + object auditor has run in parallel, the recon cache will have entries + of the form: {'object_auditor_stats_ALL': { 'disk1': {..}, + 'disk2': {..}, + 'disk3': {..}, + ...}} + If the object auditor hasn't run in parallel, the recon cache will have + entries of the form: {'object_auditor_stats_ALL': {...}}. + The ZBF auditor doesn't run in parallel. However, if a subset of + devices is selected for auditing, the recon cache will have an entry + of the form: {'object_auditor_stats_ZBF': { 'disk1disk2..diskN': {}} + We use this generator to find all instances of a particular key in + these multi-level dictionaries. 
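+
+ For example (an illustrative sketch, not part of the original change),
+ given {'object_auditor_stats_ALL': {'disk1': {'errors': 1},
+ 'disk2': {'errors': 2}}}, nested_get_value('errors', entry) yields
+ 1 and then 2, so callers can take sum(...) to get a per-host total of 3.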
+ """ + for k, v in recon_entry.items(): + if isinstance(v, dict): + for value in self.nested_get_value(key, v): + yield value + if k == key: + yield v + + def object_auditor_check(self, hosts): + """ + Obtain and print obj auditor statistics + + :param hosts: set of hosts to check. in the format of: + set([('127.0.0.1', 6220), ('127.0.0.2', 6230)]) + """ + all_scan = {} + zbf_scan = {} + atime = 'audit_time' + bprocessed = 'bytes_processed' + passes = 'passes' + errors = 'errors' + quarantined = 'quarantined' + recon = Scout("auditor/object", self.verbose, self.suppress_errors, + self.timeout) + print("[%s] Checking auditor stats " % self._ptime()) + for url, response, status, ts_start, ts_end in self.pool.imap( + recon.scout, hosts): + if status == 200: + if response['object_auditor_stats_ALL']: + all_scan[url] = response['object_auditor_stats_ALL'] + if response['object_auditor_stats_ZBF']: + zbf_scan[url] = response['object_auditor_stats_ZBF'] + if len(all_scan) > 0: + stats = {} + stats[atime] = [sum(self.nested_get_value(atime, all_scan[i])) + for i in all_scan] + stats[bprocessed] = [sum(self.nested_get_value(bprocessed, + all_scan[i])) for i in all_scan] + stats[passes] = [sum(self.nested_get_value(passes, all_scan[i])) + for i in all_scan] + stats[errors] = [sum(self.nested_get_value(errors, all_scan[i])) + for i in all_scan] + stats[quarantined] = [sum(self.nested_get_value(quarantined, + all_scan[i])) for i in all_scan] + for k in stats: + if None in stats[k]: + stats[k] = [x for x in stats[k] if x is not None] + if len(stats[k]) < 1: + print("[Auditor %s] - No hosts returned valid data." % k) + else: + computed = self._gen_stats(stats[k], + name='ALL_%s_last_path' % k) + if computed['reported'] > 0: + self._print_stats(computed) + else: + print("[ALL_auditor] - No hosts returned valid data.") + else: + print("[ALL_auditor] - No hosts returned valid data.") + if len(zbf_scan) > 0: + stats = {} + stats[atime] = [sum(self.nested_get_value(atime, zbf_scan[i])) + for i in zbf_scan] + stats[bprocessed] = [sum(self.nested_get_value(bprocessed, + zbf_scan[i])) for i in zbf_scan] + stats[errors] = [sum(self.nested_get_value(errors, zbf_scan[i])) + for i in zbf_scan] + stats[quarantined] = [sum(self.nested_get_value(quarantined, + zbf_scan[i])) for i in zbf_scan] + for k in stats: + if None in stats[k]: + stats[k] = [x for x in stats[k] if x is not None] + if len(stats[k]) < 1: + print("[Auditor %s] - No hosts returned valid data." % k) + else: + computed = self._gen_stats(stats[k], + name='ZBF_%s_last_path' % k) + if computed['reported'] > 0: + self._print_stats(computed) + else: + print("[ZBF_auditor] - No hosts returned valid data.") + else: + print("[ZBF_auditor] - No hosts returned valid data.") + print("=" * 79) + + def sharding_check(self, hosts): + """ + Obtain and print sharding statistics + + :param hosts: set of hosts to check. 
in the format of: + set([('127.0.0.1', 6221), ('127.0.0.2', 6231)]) + """ + stats = {'sharding_time': [], + 'attempted': [], 'failure': [], 'success': []} + recon = Scout("sharding", self.verbose, + self.suppress_errors, self.timeout) + print("[%s] Checking on sharders" % self._ptime()) + least_recent_time = 9999999999 + least_recent_url = None + most_recent_time = 0 + most_recent_url = None + for url, response, status, ts_start, ts_end in self.pool.imap( + recon.scout, hosts): + if status == 200: + stats['sharding_time'].append(response.get('sharding_time', 0)) + shard_stats = response.get('sharding_stats') + if shard_stats: + # Sharding has a ton more stats, like "no_change". + # Not sure if we need them at all, or maybe for -v. + for stat_key in ['attempted', 'failure', 'success']: + stats[stat_key].append(shard_stats.get(stat_key)) + last = response.get('sharding_last', 0) + if last is None: + continue + if last < least_recent_time: + least_recent_time = last + least_recent_url = url + if last > most_recent_time: + most_recent_time = last + most_recent_url = url + for k in stats: + if stats[k]: + computed = self._gen_stats(stats[k], name=k) + if computed['reported'] > 0: + self._print_stats(computed) + else: + print("[%s] - No hosts returned valid data." % k) + else: + print("[%s] - No hosts returned valid data." % k) + if least_recent_url is not None: + host = urlparse(least_recent_url).netloc + if not least_recent_time: + print('Oldest completion was NEVER by %s.' % host) + else: + elapsed = time.time() - least_recent_time + elapsed, elapsed_unit = seconds2timeunit(elapsed) + print('Oldest completion was %s (%d %s ago) by %s.' % ( + self._ptime(least_recent_time), + elapsed, elapsed_unit, host)) + if most_recent_url is not None: + host = urlparse(most_recent_url).netloc + elapsed = time.time() - most_recent_time + elapsed, elapsed_unit = seconds2timeunit(elapsed) + print('Most recent completion was %s (%d %s ago) by %s.' % ( + self._ptime(most_recent_time), + elapsed, elapsed_unit, host)) + print("=" * 79) + + def load_check(self, hosts): + """ + Obtain and print load average statistics + + :param hosts: set of hosts to check. in the format of: + set([('127.0.0.1', 6220), ('127.0.0.2', 6230)]) + """ + load1 = {} + load5 = {} + load15 = {} + recon = Scout("load", self.verbose, self.suppress_errors, + self.timeout) + print("[%s] Checking load averages" % self._ptime()) + for url, response, status, ts_start, ts_end in self.pool.imap( + recon.scout, hosts): + if status == 200: + load1[url] = response['1m'] + load5[url] = response['5m'] + load15[url] = response['15m'] + stats = {"1m": load1, "5m": load5, "15m": load15} + for item in stats: + if len(stats[item]) > 0: + computed = self._gen_stats(stats[item].values(), + name='%s_load_avg' % item) + self._print_stats(computed) + else: + print("[%s_load_avg] - No hosts returned valid data." % item) + print("=" * 79) + + def quarantine_check(self, hosts): + """ + Obtain and print quarantine statistics + + :param hosts: set of hosts to check. 
in the format of: + set([('127.0.0.1', 6220), ('127.0.0.2', 6230)]) + """ + objq = {} + conq = {} + acctq = {} + stats = {} + recon = Scout("quarantined", self.verbose, self.suppress_errors, + self.timeout) + print("[%s] Checking quarantine" % self._ptime()) + for url, response, status, ts_start, ts_end in self.pool.imap( + recon.scout, hosts): + if status == 200: + objq[url] = response['objects'] + conq[url] = response['containers'] + acctq[url] = response['accounts'] + for key in response.get('policies', {}): + pkey = "objects_%s" % key + stats.setdefault(pkey, {}) + stats[pkey][url] = response['policies'][key]['objects'] + stats.update({"objects": objq, "containers": conq, "accounts": acctq}) + for item in stats: + if len(stats[item]) > 0: + computed = self._gen_stats(stats[item].values(), + name='quarantined_%s' % item) + self._print_stats(computed) + else: + print("No hosts returned valid data.") + print("=" * 79) + + def socket_usage(self, hosts): + """ + Obtain and print /proc/net/sockstat statistics + + :param hosts: set of hosts to check. in the format of: + set([('127.0.0.1', 6220), ('127.0.0.2', 6230)]) + """ + inuse4 = {} + mem = {} + inuse6 = {} + timewait = {} + orphan = {} + recon = Scout("sockstat", self.verbose, self.suppress_errors, + self.timeout) + print("[%s] Checking socket usage" % self._ptime()) + for url, response, status, ts_start, ts_end in self.pool.imap( + recon.scout, hosts): + if status == 200: + inuse4[url] = response['tcp_in_use'] + mem[url] = response['tcp_mem_allocated_bytes'] + inuse6[url] = response.get('tcp6_in_use', 0) + timewait[url] = response['time_wait'] + orphan[url] = response['orphan'] + stats = {"tcp_in_use": inuse4, "tcp_mem_allocated_bytes": mem, + "tcp6_in_use": inuse6, "time_wait": timewait, + "orphan": orphan} + for item in stats: + if len(stats[item]) > 0: + computed = self._gen_stats(stats[item].values(), item) + self._print_stats(computed) + else: + print("No hosts returned valid data.") + print("=" * 79) + + def disk_usage(self, hosts, top=0, lowest=0, human_readable=False): + """ + Obtain and print disk usage statistics + + :param hosts: set of hosts to check. in the format of: + set([('127.0.0.1', 6220), ('127.0.0.2', 6230)]) + """ + stats = {} + highs = [] + lows = [] + raw_total_used = [] + raw_total_avail = [] + percents = {} + top_percents = [(None, 0)] * top + low_percents = [(None, 100)] * lowest + recon = Scout("diskusage", self.verbose, self.suppress_errors, + self.timeout) + # We want to only query each host once, but we don't care + # which of the available ports we use. So we filter hosts by + # constructing a host->port dictionary, since the dict + # constructor ensures each key is unique, thus each host + # appears only once in filtered_hosts. 
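+ # Illustrative sketch (not part of the original change): for hosts
+ # {('10.0.0.1', 6200), ('10.0.0.1', 6210), ('10.0.0.2', 6200)},
+ # dict(hosts) keeps a single port per IP, so filtered_hosts contains
+ # exactly one ('10.0.0.1', <port>) tuple and one for 10.0.0.2.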
+ filtered_hosts = set(dict(hosts).items()) + print("[%s] Checking disk usage now" % self._ptime()) + for url, response, status, ts_start, ts_end in self.pool.imap( + recon.scout, filtered_hosts): + if status == 200: + hostusage = [] + for entry in response: + if not isinstance(entry['mounted'], bool): + print("-> %s/%s: Error: %s" % (url, entry['device'], + entry['mounted'])) + elif entry['mounted']: + used = float(entry['used']) / float(entry['size']) \ + * 100.0 + raw_total_used.append(entry['used']) + raw_total_avail.append(entry['avail']) + hostusage.append(round(used, 2)) + for ident, oused in top_percents: + if oused < used: + top_percents.append( + (url + ' ' + entry['device'], used)) + top_percents.sort(key=lambda x: -x[1]) + top_percents.pop() + break + for ident, oused in low_percents: + if oused > used: + low_percents.append( + (url + ' ' + entry['device'], used)) + low_percents.sort(key=lambda x: x[1]) + low_percents.pop() + break + stats[url] = hostusage + + for url in stats: + if len(stats[url]) > 0: + # get per host hi/los for another day + low = min(stats[url]) + high = max(stats[url]) + highs.append(high) + lows.append(low) + for percent in stats[url]: + percents[int(percent)] = percents.get(int(percent), 0) + 1 + else: + print("-> %s: Error. No drive info available." % url) + + if len(lows) > 0: + low = min(lows) + high = max(highs) + # dist graph shamelessly stolen from https://github.com/gholt/tcod + print("Distribution Graph:") + mul = 69.0 / max(percents.values()) + for percent in sorted(percents): + print('% 3d%%%5d %s' % (percent, percents[percent], + '*' * int(percents[percent] * mul))) + raw_used = sum(raw_total_used) + raw_avail = sum(raw_total_avail) + raw_total = raw_used + raw_avail + avg_used = 100.0 * raw_used / raw_total + if human_readable: + raw_used = size_suffix(raw_used) + raw_avail = size_suffix(raw_avail) + raw_total = size_suffix(raw_total) + print("Disk usage: space used: %s of %s" % (raw_used, raw_total)) + print("Disk usage: space free: %s of %s" % (raw_avail, raw_total)) + print("Disk usage: lowest: %s%%, highest: %s%%, avg: %s%%" % + (low, high, avg_used)) + else: + print("No hosts returned valid data.") + print("=" * 79) + if top_percents: + print('TOP %s' % top) + for ident, used in top_percents: + if ident: + url, device = ident.split() + host = urlparse(url).netloc.split(':')[0] + print('%.02f%% %s' % (used, '%-15s %s' % (host, device))) + if low_percents: + print('LOWEST %s' % lowest) + for ident, used in low_percents: + if ident: + url, device = ident.split() + host = urlparse(url).netloc.split(':')[0] + print('%.02f%% %s' % (used, '%-15s %s' % (host, device))) + + def time_check(self, hosts, jitter=0.0): + """ + Check a time synchronization of hosts with current time + + :param hosts: set of hosts to check. in the format of: + set([('127.0.0.1', 6220), ('127.0.0.2', 6230)]) + :param jitter: Maximal allowed time jitter + """ + + jitter = abs(jitter) + matches = 0 + errors = 0 + recon = Scout("time", self.verbose, self.suppress_errors, + self.timeout) + print("[%s] Checking time-sync" % self._ptime()) + for url, ts_remote, status, ts_start, ts_end in self.pool.imap( + recon.scout, hosts): + if status != 200: + errors = errors + 1 + continue + if (ts_remote + jitter < ts_start or ts_remote - jitter > ts_end): + diff = abs(ts_end - ts_remote) + ts_end_f = self._ptime(ts_end) + ts_remote_f = self._ptime(ts_remote) + + print("!! 
%s current time is %s, but remote is %s, " + "differs by %.4f sec" % ( + url, + ts_end_f, + ts_remote_f, + diff)) + continue + matches += 1 + if self.verbose: + print("-> %s matches." % url) + print("%s/%s hosts matched, %s error[s] while checking hosts." % ( + matches, len(hosts), errors)) + print("=" * 79) + + def version_check(self, hosts): + """ + Check OS Swift version of hosts. Inform if differs. + + :param hosts: set of hosts to check. in the format of: + set([('127.0.0.1', 6220), ('127.0.0.2', 6230)]) + """ + versions = set() + errors = 0 + print("[%s] Checking versions" % self._ptime()) + recon = Scout("version", self.verbose, self.suppress_errors, + self.timeout) + for url, response, status, ts_start, ts_end in self.pool.imap( + recon.scout, hosts): + if status != 200: + errors = errors + 1 + continue + versions.add(response['version']) + if self.verbose: + print("-> %s installed version %s" % ( + url, response['version'])) + + if not len(versions): + print("No hosts returned valid data.") + elif len(versions) == 1: + print("Versions matched (%s), " + "%s error[s] while checking hosts." % ( + versions.pop(), errors)) + else: + print("Versions not matched (%s), " + "%s error[s] while checking hosts." % ( + ", ".join(sorted(versions)), errors)) + + print("=" * 79) + + def _get_ring_names(self, policy=None): + """ + Retrieve name of ring files. + + If no policy is passed and the server type is object, + the ring names of all storage-policies are retrieved. + + :param policy: name or index of storage policy, only applicable + with server_type==object. + :returns: list of ring names. + """ + if self.server_type == 'object': + ring_names = [p.ring_name for p in POLICIES if ( + p.name == policy or not policy or ( + policy.isdigit() and int(policy) == int(p) or + (isinstance(policy, str) + and policy in p.aliases)))] + else: + ring_names = [self.server_type] + + return ring_names + + def main(self): + """ + Retrieve and report cluster info from hosts running recon middleware. + """ + print("=" * 79) + usage = ''' + usage: %prog [ []] + [-v] [--suppress] [-a] [-r] [-u] [-d] [-R] + [-l] [-T] [--md5] [--auditor] [--updater] [--expirer] [--sockstat] + [--human-readable] + + \taccount|container|object + Defaults to object server. 
+ + ex: %prog container -l --auditor + ''' + args = optparse.OptionParser(usage) + args.add_option('--verbose', '-v', action="store_true", + help="Print verbose info") + args.add_option('--suppress', action="store_true", + help="Suppress most connection related errors") + args.add_option('--async', '-a', + action="store_true", dest="async_check", + help="Get async stats") + args.add_option('--replication', '-r', action="store_true", + help="Get replication stats") + args.add_option('--reconstruction', '-R', action="store_true", + help="Get reconstruction stats") + args.add_option('--auditor', action="store_true", + help="Get auditor stats") + args.add_option('--updater', action="store_true", + help="Get updater stats") + args.add_option('--expirer', action="store_true", + help="Get expirer stats") + args.add_option('--sharding', action="store_true", + help="Get sharding stats") + args.add_option('--unmounted', '-u', action="store_true", + help="Check cluster for unmounted devices") + args.add_option('--diskusage', '-d', action="store_true", + help="Get disk usage stats") + args.add_option('--human-readable', action="store_true", + help="Use human readable suffix for disk usage stats") + args.add_option('--loadstats', '-l', action="store_true", + help="Get cluster load average stats") + args.add_option('--quarantined', '-q', action="store_true", + help="Get cluster quarantine stats") + args.add_option('--validate-servers', action="store_true", + help="Validate servers on the ring") + args.add_option('--md5', action="store_true", + help="Get md5sum of servers ring and compare to " + "local copy") + args.add_option('--sockstat', action="store_true", + help="Get cluster socket usage stats") + args.add_option('--driveaudit', action="store_true", + help="Get drive audit error stats") + args.add_option('--time', '-T', action="store_true", + help="Check time synchronization") + args.add_option('--jitter', type="float", default=0.0, + help="Maximal allowed time jitter") + args.add_option('--swift-versions', action="store_true", + help="Check swift versions") + args.add_option('--top', type='int', metavar='COUNT', default=0, + help='Also show the top COUNT entries in rank order.') + args.add_option('--lowest', type='int', metavar='COUNT', default=0, + help='Also show the lowest COUNT entries in rank \ + order.') + args.add_option('--all', action="store_true", + help="Perform all checks. 
Equal to \t\t\t-arRudlqT " + "--md5 --sockstat --auditor --updater --expirer " + "--driveaudit --validate-servers --swift-versions") + args.add_option('--region', type="int", + help="Only query servers in specified region") + args.add_option('--zone', '-z', type="int", + help="Only query servers in specified zone") + args.add_option('--timeout', '-t', type="int", metavar="SECONDS", + help="Time to wait for a response from a server", + default=5) + args.add_option('--swiftdir', default="/etc/swift", + help="Default = /etc/swift") + args.add_option('--policy', '-p', + help='Only query object servers in specified ' + 'storage policy (specified as name or index).') + options, arguments = args.parse_args() + + if len(sys.argv) <= 1 or len(arguments) > len(self.check_types): + args.print_help() + sys.exit(0) + + if arguments: + arguments = set(arguments) + if arguments.issubset(self.check_types): + server_types = arguments + else: + print("Invalid Server Type") + args.print_help() + sys.exit(1) + else: # default + server_types = ['object'] + + swift_dir = options.swiftdir + if set_swift_dir(swift_dir): + reload_storage_policies() + + self.verbose = options.verbose + self.suppress_errors = options.suppress + self.timeout = options.timeout + + for server_type in server_types: + self.server_type = server_type + ring_names = self._get_ring_names(options.policy) + if not ring_names: + print('Invalid Storage Policy: %s' % options.policy) + args.print_help() + sys.exit(0) + hosts = self.get_hosts(options.region, options.zone, + swift_dir, ring_names) + print("--> Starting reconnaissance on %s hosts (%s)" % + (len(hosts), self.server_type)) + print("=" * 79) + if options.all: + if self.server_type == 'object': + self.async_check(hosts) + self.object_auditor_check(hosts) + self.updater_check(hosts) + self.expirer_check(hosts) + self.reconstruction_check(hosts) + elif self.server_type == 'container': + self.auditor_check(hosts) + self.updater_check(hosts) + self.sharding_check(hosts) + elif self.server_type == 'account': + self.auditor_check(hosts) + self.replication_check(hosts) + self.umount_check(hosts) + self.load_check(hosts) + self.disk_usage(hosts, options.top, options.lowest, + options.human_readable) + self.get_ringmd5(hosts, swift_dir) + self.get_swiftconfmd5(hosts) + self.quarantine_check(hosts) + self.socket_usage(hosts) + self.server_type_check(hosts) + self.driveaudit_check(hosts) + self.time_check(hosts, options.jitter) + self.version_check(hosts) + else: + if options.async_check: + if self.server_type == 'object': + self.async_check(hosts) + else: + print("Error: Can't check asyncs on non object " + "servers.") + print("=" * 79) + if options.unmounted: + self.umount_check(hosts) + if options.replication: + self.replication_check(hosts) + if options.auditor: + if self.server_type == 'object': + self.object_auditor_check(hosts) + else: + self.auditor_check(hosts) + if options.updater: + if self.server_type == 'account': + print("Error: Can't check updaters on account " + "servers.") + print("=" * 79) + else: + self.updater_check(hosts) + if options.expirer: + if self.server_type == 'object': + self.expirer_check(hosts) + else: + print("Error: Can't check expirer on non object " + "servers.") + print("=" * 79) + if options.sharding: + if self.server_type == 'container': + self.sharding_check(hosts) + else: + print("Error: Can't check sharding on non container " + "servers.") + print("=" * 79) + if options.reconstruction: + if self.server_type == 'object': + self.reconstruction_check(hosts) + 
else: + print("Error: Can't check reconstruction stats on " + "non object servers.") + print("=" * 79) + if options.validate_servers: + self.server_type_check(hosts) + if options.loadstats: + self.load_check(hosts) + if options.diskusage: + self.disk_usage(hosts, options.top, options.lowest, + options.human_readable) + if options.md5: + self.get_ringmd5(hosts, swift_dir) + self.get_swiftconfmd5(hosts) + if options.quarantined: + self.quarantine_check(hosts) + if options.sockstat: + self.socket_usage(hosts) + if options.driveaudit: + self.driveaudit_check(hosts) + if options.time: + self.time_check(hosts, options.jitter) + if options.swift_versions: + self.version_check(hosts) + + +def main(): + try: + reconnoiter = SwiftRecon() + reconnoiter.main() + except KeyboardInterrupt: + print('\n') diff --git a/swift/cli/recon_cron.py b/swift/cli/recon_cron.py new file mode 100644 index 0000000000..bd1dd22052 --- /dev/null +++ b/swift/cli/recon_cron.py @@ -0,0 +1,73 @@ +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +import os +import sys +import time + +from eventlet import Timeout + +from swift.common.utils import get_logger, dump_recon_cache, readconf, \ + lock_path, listdir +from swift.common.recon import RECON_OBJECT_FILE, DEFAULT_RECON_CACHE_PATH +from swift.obj.diskfile import ASYNCDIR_BASE + + +def get_async_count(device_dir): + async_count = 0 + for i in listdir(device_dir): + device = os.path.join(device_dir, i) + if not os.path.isdir(device): + continue + for asyncdir in listdir(device): + # skip stuff like "accounts", "containers", etc. 
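+ # Illustrative sketch (not part of the original change): with
+ # ASYNCDIR_BASE == 'async_pending', this keeps 'async_pending' and
+ # per-policy variants such as 'async_pending-1', and skips
+ # 'objects', 'accounts', 'containers', 'tmp' and the like.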
+ if not (asyncdir == ASYNCDIR_BASE or + asyncdir.startswith(ASYNCDIR_BASE + '-')): + continue + async_pending = os.path.join(device, asyncdir) + + if os.path.isdir(async_pending): + for entry in listdir(async_pending): + if os.path.isdir(os.path.join(async_pending, entry)): + async_hdir = os.path.join(async_pending, entry) + async_count += len(listdir(async_hdir)) + return async_count + + +def main(): + try: + conf_path = sys.argv[1] + except Exception: + print("Usage: %s CONF_FILE" % sys.argv[0].split('/')[-1]) + print("ex: swift-recon-cron /etc/swift/object-server.conf") + return 1 + conf = readconf(conf_path, 'filter:recon') + device_dir = conf.get('devices', '/srv/node') + recon_cache_path = conf.get('recon_cache_path', DEFAULT_RECON_CACHE_PATH) + recon_lock_path = conf.get('recon_lock_path', '/var/lock') + cache_file = os.path.join(recon_cache_path, RECON_OBJECT_FILE) + lock_dir = os.path.join(recon_lock_path, "swift-recon-object-cron") + conf['log_name'] = conf.get('log_name', 'recon-cron') + logger = get_logger(conf, log_route='recon-cron') + try: + with lock_path(lock_dir): + asyncs = get_async_count(device_dir) + dump_recon_cache({ + 'async_pending': asyncs, + 'async_pending_last': time.time(), + }, cache_file, logger) + except (Exception, Timeout) as err: + msg = 'Exception during recon-cron while accessing devices' + logger.exception(msg) + print('%s: %s' % (msg, err)) + return 1 diff --git a/swift/cli/reconciler_enqueue.py b/swift/cli/reconciler_enqueue.py new file mode 100644 index 0000000000..367b0b5e08 --- /dev/null +++ b/swift/cli/reconciler_enqueue.py @@ -0,0 +1,74 @@ +#!/usr/bin/env python +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. +import sys +from optparse import OptionParser + +import eventlet.debug + +from swift.common.ring import Ring +from swift.common.utils import split_path +from swift.common.storage_policy import POLICIES + +from swift.container.reconciler import add_to_reconciler_queue +""" +This tool is primarily for debugging and development but can be used an example +of how an operator could enqueue objects manually if a problem is discovered - +might be particularly useful if you need to hack a fix into the reconciler +and re-run it. +""" + +USAGE = """ +%prog [options] + +This script enqueues an object to be evaluated by the reconciler. + +Arguments: +policy_index: the policy the object is currently stored in. + /a/c/o: the full path of the object - utf-8 + timestamp: the timestamp of the datafile/tombstone. 
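+
+Illustrative example (a sketch, not part of the original change; it assumes
+the swift-reconciler-enqueue console script wraps this module):
+
+  swift-reconciler-enqueue 1 /AUTH_test/misplaced/obj 1618998528.12345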
+ +""".strip() + +parser = OptionParser(USAGE) +parser.add_option('-X', '--op', default='PUT', choices=('PUT', 'DELETE'), + help='the method of the misplaced operation') +parser.add_option('-f', '--force', action='store_true', + help='force an object to be re-enqueued') + + +def main(): + eventlet.debug.hub_exceptions(True) + options, args = parser.parse_args() + try: + policy_index, path, timestamp = args + except ValueError: + sys.exit(parser.print_help()) + container_ring = Ring('/etc/swift/container.ring.gz') + policy = POLICIES.get_by_index(policy_index) + if not policy: + return 'ERROR: invalid storage policy index: %s' % policy + try: + account, container, obj = split_path(path, 3, 3, True) + except ValueError as e: + return 'ERROR: %s' % e + container_name = add_to_reconciler_queue( + container_ring, account, container, obj, + policy.idx, timestamp, options.op, force=options.force) + if not container_name: + return 'ERROR: unable to enqueue!' + print(container_name) + + +if __name__ == "__main__": + sys.exit(main()) diff --git a/swift/cli/relinker.py b/swift/cli/relinker.py new file mode 100644 index 0000000000..38e82fa6cf --- /dev/null +++ b/swift/cli/relinker.py @@ -0,0 +1,953 @@ +#!/usr/bin/env python +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
+ + +import argparse +import datetime +import errno +import fcntl +import json +import logging +import os +import time +from collections import defaultdict + +from eventlet import hubs + +from swift.common.exceptions import LockTimeout +from swift.common.storage_policy import POLICIES +from swift.common.utils import replace_partition_in_path, config_true_value, \ + audit_location_generator, get_logger, readconf, drop_privileges, \ + RateLimitedIterator, distribute_evenly, get_prefixed_logger, \ + non_negative_float, non_negative_int, config_auto_int_value, \ + dump_recon_cache, get_partition_from_path, get_hub +from swift.common.utils.logs import SwiftLogAdapter +from swift.obj import diskfile +from swift.common.recon import RECON_RELINKER_FILE, DEFAULT_RECON_CACHE_PATH + + +LOCK_FILE = '.relink.{datadir}.lock' +STATE_FILE = 'relink.{datadir}.json' +STATE_TMP_FILE = '.relink.{datadir}.json.tmp' +STEP_RELINK = 'relink' +STEP_CLEANUP = 'cleanup' +EXIT_SUCCESS = 0 +EXIT_NO_APPLICABLE_POLICY = 2 +EXIT_ERROR = 1 +DEFAULT_STATS_INTERVAL = 300.0 + + +def recursive_defaultdict(): + return defaultdict(recursive_defaultdict) + + +def policy(policy_name_or_index): + value = POLICIES.get_by_name_or_index(policy_name_or_index) + if value is None: + raise ValueError + return value + + +def _aggregate_stats(base_stats, update_stats): + for key, value in update_stats.items(): + base_stats.setdefault(key, 0) + base_stats[key] += value + + return base_stats + + +def _aggregate_recon_stats(base_stats, updated_stats): + for k, v in updated_stats.items(): + if k == 'stats': + base_stats['stats'] = _aggregate_stats(base_stats['stats'], v) + elif k == "start_time": + base_stats[k] = min(base_stats.get(k, v), v) + elif k in ("timestamp", "total_time"): + base_stats[k] = max(base_stats.get(k, 0), v) + elif k in ('parts_done', 'total_parts'): + base_stats[k] += v + + return base_stats + + +def _zero_stats(): + return { + 'hash_dirs': 0, + 'files': 0, + 'linked': 0, + 'removed': 0, + 'errors': 0} + + +def _zero_collated_stats(): + return { + 'parts_done': 0, + 'total_parts': 0, + 'total_time': 0, + 'stats': _zero_stats()} + + +class Relinker(object): + def __init__(self, conf, logger, device_list=None, do_cleanup=False): + self.conf = conf + self.recon_cache = os.path.join(self.conf['recon_cache_path'], + RECON_RELINKER_FILE) + self.logger = logger + self.device_list = device_list or [] + self.do_cleanup = do_cleanup + self.root = self.conf['devices'] + if len(self.device_list) == 1: + self.root = os.path.join(self.root, list(self.device_list)[0]) + self.part_power = self.next_part_power = None + self.diskfile_mgr = None + self.dev_lock = None + self._last_recon_update = time.time() + self.stats_interval = float(conf.get( + 'stats_interval', DEFAULT_STATS_INTERVAL)) + self.diskfile_router = diskfile.DiskFileRouter(self.conf, self.logger) + self.stats = _zero_stats() + self.devices_data = recursive_defaultdict() + self.policy_count = 0 + self.pid = os.getpid() + self.linked_into_partitions = set() + + def _aggregate_dev_policy_stats(self): + for dev_data in self.devices_data.values(): + dev_data.update(_zero_collated_stats()) + for policy_data in dev_data.get('policies', {}).values(): + _aggregate_recon_stats(dev_data, policy_data) + + def _update_recon(self, device=None, force_dump=False): + if not force_dump and self._last_recon_update + self.stats_interval \ + > time.time(): + # not time yet! 
+ return + if device: + # dump recon stats for the device + num_parts_done = sum( + 1 for part_done in self.states["state"].values() + if part_done) + num_total_parts = len(self.states["state"]) + step = STEP_CLEANUP if self.do_cleanup else STEP_RELINK + policy_dev_progress = {'step': step, + 'parts_done': num_parts_done, + 'total_parts': num_total_parts, + 'timestamp': time.time()} + self.devices_data[device]['policies'][self.policy.idx].update( + policy_dev_progress) + + # aggregate device policy level values into device level + self._aggregate_dev_policy_stats() + + # We want to periodically update the worker recon timestamp so we know + # it's still running + recon_data = self._update_worker_stats(recon_dump=False) + + recon_data.update({'devices': self.devices_data}) + if device: + self.logger.debug("Updating recon for %s", device) + else: + self.logger.debug("Updating recon") + self._last_recon_update = time.time() + dump_recon_cache(recon_data, self.recon_cache, self.logger) + + @property + def total_errors(self): + # first make sure the policy data is aggregated down to the device + # level + self._aggregate_dev_policy_stats() + return sum([sum([ + dev.get('stats', {}).get('errors', 0), + dev.get('stats', {}).get('unmounted', 0), + dev.get('stats', {}).get('unlistable_partitions', 0)]) + for dev in self.devices_data.values()]) + + def devices_filter(self, _, devices): + if self.device_list: + devices = [d for d in devices if d in self.device_list] + + return set(devices) + + def hook_pre_device(self, device_path): + lock_file = os.path.join(device_path, + LOCK_FILE.format(datadir=self.datadir)) + + fd = os.open(lock_file, os.O_CREAT | os.O_WRONLY) + fcntl.flock(fd, fcntl.LOCK_EX) + self.dev_lock = fd + + state_file = os.path.join(device_path, + STATE_FILE.format(datadir=self.datadir)) + self.states["state"].clear() + try: + with open(state_file, 'rt') as f: + state_from_disk = json.load(f) + if state_from_disk["next_part_power"] != \ + self.states["next_part_power"]: + raise ValueError + on_disk_part_power = state_from_disk["part_power"] + if on_disk_part_power != self.states["part_power"]: + self.states["prev_part_power"] = on_disk_part_power + raise ValueError + self.states["state"].update(state_from_disk["state"]) + except (ValueError, TypeError, KeyError): + # Bad state file: remove the file to restart from scratch + os.unlink(state_file) + except IOError as err: + # Ignore file not found error + if err.errno != errno.ENOENT: + raise + + # initialise the device in recon. 
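+ # Illustrative sketch (not part of the original change): after this block,
+ # devices_data looks roughly like
+ #   {'sdb1': {'policies': {0: {'start_time': <ts>, 'stats': {...},
+ #                              'part_power': 10, 'next_part_power': 11}}}}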
+ device = os.path.basename(device_path) + self.devices_data[device]['policies'][self.policy.idx] = { + 'start_time': time.time(), 'stats': _zero_stats(), + 'part_power': self.states["part_power"], + 'next_part_power': self.states["next_part_power"]} + self.stats = \ + self.devices_data[device]['policies'][self.policy.idx]['stats'] + self._update_recon(device) + + def hook_post_device(self, device_path): + os.close(self.dev_lock) + self.dev_lock = None + device = os.path.basename(device_path) + pol_stats = self.devices_data[device]['policies'][self.policy.idx] + total_time = time.time() - pol_stats['start_time'] + pol_stats.update({'total_time': total_time, 'stats': self.stats}) + self._update_recon(device, force_dump=True) + + def partitions_filter(self, datadir_path, partitions): + # Remove all non partitions first (eg: auditor_status_ALL.json) + partitions = [p for p in partitions if p.isdigit()] + + relinking = (self.part_power != self.next_part_power) + if relinking: + # All partitions in the upper half are new partitions and there is + # nothing to relink there + partitions = [part for part in partitions + if int(part) < 2 ** self.part_power] + elif "prev_part_power" in self.states: + # All partitions in the upper half are new partitions and there is + # nothing to clean up there + partitions = [part for part in partitions + if int(part) < 2 ** self.states["prev_part_power"]] + + # Format: { 'part': processed } + if self.states["state"]: + missing = list(set(partitions) - set(self.states["state"].keys())) + if missing: + # All missing partitions were created after the first run of + # the relinker with this part_power/next_part_power pair. This + # is expected when relinking, where new partitions appear that + # are appropriate for the target part power. In such cases, + # there's nothing to be done. Err on the side of caution + # during cleanup, however. + for part in missing: + self.states["state"][part] = relinking + partitions = [ + str(part) for part, processed in self.states["state"].items() + if not processed] + else: + self.states["state"].update({ + str(part): False for part in partitions}) + + # Always scan the partitions in reverse order to minimize the amount + # of IO (it actually only matters for relink, not for cleanup). + # + # Initial situation: + # objects/0/000/00000000...00000000/12345.data + # -> relinked to objects/1/000/10000000...00000000/12345.data + # + # If the relinker then scan partition 1, it will listdir that object + # while it's unnecessary. By working in reverse order of partitions, + # this is avoided. + partitions = sorted(partitions, key=int, reverse=True) + + # do this last so that self.states, and thus the state file, has been + # initiated with *all* partitions before partitions are restricted for + # this particular run... 
+ conf_partitions = self.conf.get('partitions') + if conf_partitions: + partitions = [p for p in partitions if int(p) in conf_partitions] + + return partitions + + def hook_pre_partition(self, partition_path): + self.pre_partition_errors = self.total_errors + self.linked_into_partitions = set() + + def hook_post_partition(self, partition_path): + datadir_path, partition = os.path.split( + os.path.abspath(partition_path)) + device_path, datadir_name = os.path.split(datadir_path) + device = os.path.basename(device_path) + state_tmp_file = os.path.join( + device_path, STATE_TMP_FILE.format(datadir=datadir_name)) + state_file = os.path.join( + device_path, STATE_FILE.format(datadir=datadir_name)) + + # We started with a partition space like + # |0 N| + # |ABCDEFGHIJKLMNOP| + # + # After relinking, it will be more like + # |0 2N| + # |AABBCCDDEEFFGGHHIIJJKKLLMMNNOOPP| + # + # We want to hold off on rehashing until after cleanup, since that is + # the point at which we've finished with filesystem manipulations. But + # there's a slight complication: we know the upper half has nothing to + # clean up, so the cleanup phase only looks at + # |0 2N| + # |AABBCCDDEEFFGGHH | + # + # To ensure that the upper half gets rehashed, too, do it as part of + # relinking; as we finish + # |0 N| + # | IJKLMNOP| + # shift to the new partition space and rehash + # |0 2N| + # | IIJJKKLLMMNNOOPP| + for dirty_partition in self.linked_into_partitions: + if self.do_cleanup or \ + dirty_partition >= 2 ** self.states['part_power']: + self.diskfile_mgr.get_hashes( + device, dirty_partition, [], self.policy) + + if self.do_cleanup: + try: + hashes = self.diskfile_mgr.get_hashes( + device, int(partition), [], self.policy) + except LockTimeout: + hashes = 1 # truthy, but invalid + # In any reasonably-large cluster, we'd expect all old + # partitions P to be empty after cleanup (i.e., it's unlikely + # that there's another partition Q := P//2 that also has data + # on this device). + # + # Try to clean up empty partitions now, so operators can use + # existing rebalance-complete metrics to monitor relinking + # progress (provided there are few/no handoffs when relinking + # starts and little data is written to handoffs during the + # increase). + if not hashes: + try: + with self.diskfile_mgr.replication_lock( + device, self.policy, partition), \ + self.diskfile_mgr.partition_lock( + device, self.policy, partition): + # Order here is somewhat important for crash-tolerance + for f in ('hashes.pkl', 'hashes.invalid', '.lock', + '.lock-replication'): + try: + os.unlink(os.path.join(partition_path, f)) + except OSError as e: + if e.errno != errno.ENOENT: + raise + # Note that as soon as we've deleted the lock files, some + # other process could come along and make new ones -- so + # this may well complain that the directory is not empty + os.rmdir(partition_path) + except (OSError, LockTimeout): + # Most likely, some data landed in here or we hit an error + # above. Let the replicator deal with things; it was worth + # a shot. + pass + + # If there were no errors, mark this partition as done. This is handy + # in case the process is interrupted and needs to resume, or there + # were errors and the relinker needs to run again. 
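        # State is persisted atomically: dump JSON to a temp file, fsync,
        # then rename over the previous state file so an interrupted run
        # never reads a half-written state. Illustrative contents (for a
        # part power 10 -> 11 increase):
        #   {"part_power": 10, "next_part_power": 11,
        #    "state": {"1023": true, "1022": false}}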
+ if self.pre_partition_errors == self.total_errors: + self.states["state"][partition] = True + with open(state_tmp_file, 'wt') as f: + json.dump(self.states, f) + os.fsync(f.fileno()) + os.rename(state_tmp_file, state_file) + num_parts_done = sum( + 1 for part in self.states["state"].values() + if part) + step = STEP_CLEANUP if self.do_cleanup else STEP_RELINK + num_total_parts = len(self.states["state"]) + self.logger.info( + "Step: %s Device: %s Policy: %s Partitions: %d/%d", + step, device, self.policy.name, num_parts_done, num_total_parts) + self._update_recon(device) + + def hashes_filter(self, suff_path, hashes): + hashes = list(hashes) + for hsh in hashes: + fname = os.path.join(suff_path, hsh) + if fname == replace_partition_in_path( + self.conf['devices'], fname, self.next_part_power): + hashes.remove(hsh) + return hashes + + def do_relink(self, device, hash_path, new_hash_path, filename, + already_quarantined=False): + """ + Attempt to relink a file from old location to new location. + + :param device: device name + :param hash_path: source hash directory path + :param new_hash_path: destination hash directory path + :param filename: filename to relink + :param already_quarantined: whether quarantine has already been + attempted + :returns: tuple of (success, created) where success is True if the link + is successfully verified, and created is True if a new link + needed to be created for successful verification (if created + is True for any new link in any hash_path some caller above + us should ideally invalidate the whole suffix) + """ + old_file = os.path.join(hash_path, filename) + new_file = os.path.join(new_hash_path, filename) + success = created = False + try: + created = diskfile.relink_paths(old_file, new_file) + success = True + except FileExistsError: + # we've detected a hardlink collision, so we need to handle it + # depending on what kind of file it is and our mode and + # configuration + if filename.endswith('.ts'): + # special case for duplicate tombstones, see: + # https://bugs.launchpad.net/swift/+bug/1921718 + # https://bugs.launchpad.net/swift/+bug/1934142 + self.logger.debug( + "Relinking%s: tolerating different inodes for " + "tombstone with same timestamp: %s to %s", + ' (cleanup)' if self.do_cleanup else '', + old_file, new_file) + success = True + elif self.conf['clobber_hardlink_collisions']: + if self.do_cleanup: + # At this point your clients are already *in* the new part + # dir, if the "better" data was in the old part dir you're + # already hurting and maybe flipped back to retry the + # relink phase again? If you're moving forward with the + # cleanup presumably you're ready for this circus to be + # over and doing extra io to quarantine the data you're + # currently using and replace it with old data seems less + # attractive than letting the un-referenced data get + # cleaned up. But there might be a case to argue that + # clobber_hardlink_collision should quarantine old_file + # here before returning success. + self.logger.debug( + "Relinking%s: tolerating hardlink collision: " + "%s to %s", + ' (cleanup)' if self.do_cleanup else '', + old_file, new_file) + success = True + elif already_quarantined: + # Already attempted quarantine, this is a failure, but user + # can retry (or already_quarantined becomes a counter?) + # N.B. 
this can exit non-zero w/o logging at "error" + self.logger.warning( + "Relinking%s: hardlink collision persists after " + "quarantine: %s to %s", + ' (cleanup)' if self.do_cleanup else '', + old_file, new_file) + else: + # During relink phase, quarantine and retry once + dev_path = os.path.join(self.diskfile_mgr.devices, device) + to_dir = diskfile.quarantine_renamer(dev_path, new_file) + self.logger.info( + "Relinking%s: clobbering hardlink collision: " + "%s moved to %s", + ' (cleanup)' if self.do_cleanup else '', + new_file, to_dir) + # retry with quarantine flag set + return self.do_relink( + device, hash_path, new_hash_path, filename, + already_quarantined=True) + else: + self.logger.error( + "Error relinking%s: hardlink collision: " + "%s to %s (consider enabling clobber_hardlink_collisions)", + ' (cleanup)' if self.do_cleanup else '', + old_file, new_file) + except Exception as exc: + # Depending on what kind of errors these are, it might be + # reasonable to consider them "warnings" if we expect re-running + # the relinker would be able to fix them (like if it's just a + # general file-system corruption error and your auditor is still + # running maybe it will quarantine bad paths to clear the way). + # But AFAIK all currently known/observed error conditions are + # enumerated above and any unknown error conditions may not be + # fixable by simply re-running the relinker: so we log them as + # error to match the expected non-zero return code. + self.logger.error( + "Error relinking%s: failed to relink %s to %s: %s", + ' (cleanup)' if self.do_cleanup else '', + old_file, new_file, exc) + if created: + self.logger.debug( + "Relinking%s created link: %s to %s", + ' (cleanup)' if self.do_cleanup else '', + old_file, new_file) + return success, created + + def process_location(self, device, hash_path, new_hash_path): + """ + Handle relink of all files in a hash_dir path. + + Compare the contents of each hash dir with contents of same hash + dir in its new partition to verify that the new location has the + most up to date set of files. The new location may have newer + files if it has been updated since relinked. + + If any new links are created the suffix will be invalidated. + In cleanup mode, the unwanted files in the old hash_path will be + removed as long as there are no errors. + + :param device: device name + :param hash_path: old hash directory path + :param new_hash_path: new hash directory path + """ + self.stats['hash_dirs'] += 1 + + # Get on disk data for new and old locations, cleaning up any + # reclaimable or obsolete files in each. The new location is + # cleaned up *before* the old location to prevent false negatives + # where the old still has a file that has been cleaned up in the + # new; cleaning up the new location first ensures that the old will + # always be 'cleaner' than the new. + new_df_data = self.diskfile_mgr.cleanup_ondisk_files(new_hash_path) + old_df_data = self.diskfile_mgr.cleanup_ondisk_files(hash_path) + # Now determine the most up to date set of on disk files would be + # given the content of old and new locations... 
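        # Of the combined old + new file sets, only names that still exist
        # in the old hash dir need a verified hard link in the new location;
        # anything classified as obsolete is dropped entirely.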
+ new_files = set(new_df_data['files']) + old_files = set(old_df_data['files']) + union_files = new_files.union(old_files) + union_data = self.diskfile_mgr.get_ondisk_files( + union_files, '', verify=False) + obsolete_files = set(info['filename'] + for info in union_data.get('obsolete', [])) + # drop 'obsolete' files but retain 'unexpected' files which might + # be misplaced diskfiles from another policy + required_files = union_files.difference(obsolete_files) + required_links = required_files.intersection(old_files) + + missing_links = 0 + created_links = 0 + unwanted_files = [] + for filename in required_links: + # Before removing old files, be sure that the corresponding + # required new files exist by calling relink_paths again. There + # are several possible outcomes: + # - The common case is that the new file exists, in which case + # relink_paths checks that the new file has the same inode + # as the old file. An exception is raised if the inode of + # the new file is not the same as the old file. + # - The new file may not exist because the relinker failed to + # create the link to the old file and has erroneously moved + # on to cleanup. In this case the relink_paths will create + # the link now or raise an exception if that fails. + # - The new file may not exist because some other process, + # such as an object server handling a request, has cleaned + # it up since we called cleanup_ondisk_files(new_hash_path). + # In this case a new link will be created to the old file. + # This is unnecessary but simpler than repeating the + # evaluation of what links are now required and safer than + # assuming that a non-existent file that *was* required is + # no longer required. The new file will eventually be + # cleaned up again. + self.stats['files'] += 1 + success, created = self.do_relink( + device, hash_path, new_hash_path, filename) + if success: + if created: + created_links += 1 + self.stats['linked'] += 1 + else: + self.stats['errors'] += 1 + missing_links += 1 + if created_links: + self.linked_into_partitions.add(get_partition_from_path( + self.conf['devices'], new_hash_path)) + try: + diskfile.invalidate_hash(os.path.dirname(new_hash_path)) + except (Exception, LockTimeout) as exc: + # at this point, the link's created. even if we counted it as + # an error, a subsequent run wouldn't find any work to do. so, + # don't bother; instead, wait for replication to be re-enabled + # so post-replication rehashing or periodic rehashing can + # eventually pick up the change + self.logger.warning( + 'Error invalidating suffix for %s: %r', + new_hash_path, exc) + + if self.do_cleanup and not missing_links: + # use the sorted list to help unit testing + unwanted_files = old_df_data['files'] + + # the new partition hash dir has the most up to date set of on + # disk files so it is safe to delete the old location... + rehash = False + for filename in unwanted_files: + old_file = os.path.join(hash_path, filename) + try: + os.remove(old_file) + except OSError as exc: + # N.B. 
if we want to allow old_file to get quarantined this + # should probably be robust to ENOENT + self.logger.warning('Error cleaning up %s: %r', old_file, exc) + self.stats['errors'] += 1 + else: + rehash = True + self.stats['removed'] += 1 + self.logger.debug("Removed %s", old_file) + + if rehash: + # Even though we're invalidating the suffix, don't update + # self.linked_into_partitions -- we only care about them for + # relinking into the new part-power space + try: + diskfile.invalidate_hash(os.path.dirname(hash_path)) + except (Exception, LockTimeout) as exc: + # note: not counted as an error + self.logger.warning( + 'Error invalidating suffix for %s: %r', + hash_path, exc) + + def place_policy_stat(self, dev, policy, stat, value): + stats = self.devices_data[dev]['policies'][policy.idx].setdefault( + "stats", _zero_stats()) + stats[stat] = stats.get(stat, 0) + value + + def process_policy(self, policy): + self.logger.info( + 'Processing files for policy %s under %s (cleanup=%s)', + policy.name, self.root, self.do_cleanup) + self.part_power = policy.object_ring.part_power + self.next_part_power = policy.object_ring.next_part_power + self.diskfile_mgr = self.diskfile_router[policy] + self.datadir = diskfile.get_data_dir(policy) + self.states = { + "part_power": self.part_power, + "next_part_power": self.next_part_power, + "state": {}, + } + audit_stats = {} + + locations = audit_location_generator( + self.conf['devices'], + self.datadir, + mount_check=self.conf['mount_check'], + devices_filter=self.devices_filter, + hook_pre_device=self.hook_pre_device, + hook_post_device=self.hook_post_device, + partitions_filter=self.partitions_filter, + hook_pre_partition=self.hook_pre_partition, + hook_post_partition=self.hook_post_partition, + hashes_filter=self.hashes_filter, + logger=self.logger, + error_counter=audit_stats, + yield_hash_dirs=True + ) + if self.conf['files_per_second'] > 0: + locations = RateLimitedIterator( + locations, self.conf['files_per_second']) + for hash_path, device, _part_num in locations: + # note, in cleanup step next_part_power == part_power + new_hash_path = replace_partition_in_path( + self.conf['devices'], hash_path, self.next_part_power) + if new_hash_path == hash_path: + continue + self.process_location(device, hash_path, new_hash_path) + + # any unmounted devices don't trigger the pre_device trigger. + # so we'll deal with them here. + for dev in audit_stats.get('unmounted', []): + self.place_policy_stat(dev, policy, 'unmounted', 1) + + # Further unlistable_partitions doesn't trigger the post_device, so + # we also need to deal with them here. 
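        # Entries are datadir paths beneath the affected device, so pull the
        # device name back out of each path before bumping its counter.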
+ for datadir in audit_stats.get('unlistable_partitions', []): + device_path, _ = os.path.split(datadir) + device = os.path.basename(device_path) + self.place_policy_stat(device, policy, 'unlistable_partitions', 1) + + def _update_worker_stats(self, recon_dump=True, return_code=None): + worker_stats = {'devices': self.device_list, + 'timestamp': time.time(), + 'return_code': return_code} + worker_data = {"workers": {str(self.pid): worker_stats}} + if recon_dump: + dump_recon_cache(worker_data, self.recon_cache, self.logger) + return worker_data + + def run(self): + num_policies = 0 + self._update_worker_stats() + for policy in self.conf['policies']: + self.policy = policy + policy.object_ring = None # Ensure it will be reloaded + policy.load_ring(self.conf['swift_dir']) + ring = policy.object_ring + if not ring.next_part_power: + continue + part_power_increased = ring.next_part_power == ring.part_power + if self.do_cleanup != part_power_increased: + continue + + num_policies += 1 + self.process_policy(policy) + + # Some stat collation happens during _update_recon and we want to force + # this to happen at the end of the run + self._update_recon(force_dump=True) + if not num_policies: + self.logger.warning( + "No policy found to increase the partition power.") + self._update_worker_stats(return_code=EXIT_NO_APPLICABLE_POLICY) + return EXIT_NO_APPLICABLE_POLICY + + if self.total_errors > 0: + log_method = self.logger.warning + # NB: audit_location_generator logs unmounted disks as warnings, + # but we want to treat them as errors + status = EXIT_ERROR + else: + log_method = self.logger.info + status = EXIT_SUCCESS + + stats = _zero_stats() + for dev_stats in self.devices_data.values(): + stats = _aggregate_stats(stats, dev_stats.get('stats', {})) + hash_dirs = stats.pop('hash_dirs') + files = stats.pop('files') + linked = stats.pop('linked') + removed = stats.pop('removed') + action_errors = stats.pop('errors') + unmounted = stats.pop('unmounted', 0) + if unmounted: + self.logger.warning('%d disks were unmounted', unmounted) + listdir_errors = stats.pop('unlistable_partitions', 0) + if listdir_errors: + self.logger.warning( + 'There were %d errors listing partition directories', + listdir_errors) + if stats: + self.logger.warning( + 'There were unexpected errors while enumerating disk ' + 'files: %r', stats) + + log_method( + '%d hash dirs processed (cleanup=%s) (%d files, %d linked, ' + '%d removed, %d errors)', hash_dirs, self.do_cleanup, files, + linked, removed, action_errors + listdir_errors) + + self._update_worker_stats(return_code=status) + return status + + +def _reset_recon(recon_cache, logger): + device_progress_recon = {'devices': {}, 'workers': {}} + dump_recon_cache(device_progress_recon, recon_cache, logger) + + +def parallel_process(do_cleanup, conf, logger, device_list=None): + """ + Fork Relinker workers based on config and wait for them to finish. 
+ + :param do_cleanup: boolean, if workers should perform cleanup step + :param conf: dict, config options + :param logger: SwiftLogAdapter instance + :kwarg device_list: list of strings, optionally limit to specific devices + + :returns: int, exit code; zero on success + """ + + # initialise recon dump for collection + # Lets start by always deleting last run's stats + recon_cache = os.path.join(conf['recon_cache_path'], RECON_RELINKER_FILE) + _reset_recon(recon_cache, logger) + + device_list = sorted(set(device_list or os.listdir(conf['devices']))) + workers = conf['workers'] + if workers == 'auto': + workers = len(device_list) + else: + workers = min(workers, len(device_list)) + + start = time.time() + logger.info('Starting relinker (cleanup=%s) using %d workers: %s' % + (do_cleanup, workers, + time.strftime('%X %x %Z', time.gmtime(start)))) + if workers == 0 or len(device_list) in (0, 1): + ret = Relinker( + conf, logger, device_list, do_cleanup=do_cleanup).run() + logger.info('Finished relinker (cleanup=%s): %s (%s elapsed)' % + (do_cleanup, time.strftime('%X %x %Z', time.gmtime()), + datetime.timedelta(seconds=time.time() - start))) + return ret + + children = {} + for worker_devs in distribute_evenly(device_list, workers): + pid = os.fork() + if pid == 0: + logger = get_prefixed_logger(logger, '[pid=%s, devs=%s] ' % ( + os.getpid(), ','.join(worker_devs))) + os._exit(Relinker( + conf, logger, worker_devs, do_cleanup=do_cleanup).run()) + else: + children[pid] = worker_devs + + final_status = EXIT_SUCCESS + final_messages = [] + while children: + pid, status = os.wait() + sig = status & 0xff + status = status >> 8 + time_delta = time.time() - start + devs = children.pop(pid, ['unknown device']) + worker_desc = '(pid=%s, devs=%s)' % (pid, ','.join(devs)) + if sig != 0: + final_status = EXIT_ERROR + final_messages.append( + 'Worker %s exited in %.1fs after receiving signal: %s' + % (worker_desc, time_delta, sig)) + continue + + if status == EXIT_SUCCESS: + continue + + if status == EXIT_NO_APPLICABLE_POLICY: + if final_status == EXIT_SUCCESS: + final_status = status + continue + + final_status = EXIT_ERROR + if status == EXIT_ERROR: + final_messages.append( + 'Worker %s completed in %.1fs with errors' + % (worker_desc, time_delta)) + else: + final_messages.append( + 'Worker %s exited in %.1fs with unexpected status %s' + % (worker_desc, time_delta, status)) + + for msg in final_messages: + logger.warning(msg) + logger.info('Finished relinker (cleanup=%s): %s (%s elapsed)' % + (do_cleanup, time.strftime('%X %x %Z', time.gmtime()), + datetime.timedelta(seconds=time.time() - start))) + return final_status + + +def auto_or_int(value): + return config_auto_int_value(value, default='auto') + + +def main(args=None): + parser = argparse.ArgumentParser( + description='Relink and cleanup objects to increase partition power') + parser.add_argument('action', choices=['relink', 'cleanup']) + parser.add_argument('conf_file', nargs='?', help=( + 'Path to config file with [object-relinker] section')) + parser.add_argument('--swift-dir', default=None, + dest='swift_dir', help='Path to swift directory') + parser.add_argument( + '--policy', default=[], dest='policies', + action='append', type=policy, + help='Policy to relink; may specify multiple (default: all)') + parser.add_argument('--devices', default=None, + dest='devices', help='Path to swift device directory') + parser.add_argument('--user', default=None, dest='user', + help='Drop privileges to this user before relinking') + 
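    # The filters below narrow a run to particular devices and/or
    # partitions; with the defaults, every local device and partition
    # is processed.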
parser.add_argument('--device', + default=[], dest='device_list', action='append', + help='Device name to relink (default: all)') + parser.add_argument('--partition', '-p', default=[], dest='partitions', + type=non_negative_int, action='append', + help='Partition to relink (default: all)') + parser.add_argument('--skip-mount-check', default=False, + help='Don\'t test if disk is mounted', + action="store_true", dest='skip_mount_check') + parser.add_argument('--files-per-second', default=None, + type=non_negative_float, dest='files_per_second', + help='Used to limit I/O. Zero implies no limit ' + '(default: no limit).') + parser.add_argument('--stats-interval', default=None, + type=non_negative_float, dest='stats_interval', + help='Emit stats to recon roughly every N seconds. ' + '(default: %d).' % DEFAULT_STATS_INTERVAL) + parser.add_argument( + '--workers', default=None, type=auto_or_int, help=( + 'Process devices across N workers ' + '(default: one worker per device)')) + parser.add_argument('--logfile', default=None, dest='logfile', + help='Set log file name. Ignored if using conf_file.') + parser.add_argument('--debug', default=False, action='store_true', + help='Enable debug mode') + parser.add_argument('--clobber-hardlink-collisions', action='store_true', + help='Tolerate hard link collisions when relinking' + 'object files. If the action is relink then the ' + 'file in the new target part dir is quarantined ' + 'and the relink is retried. If the action is ' + 'cleanup then the file in the new target dir is ' + 'retained and the file in the old target dir is ' + 'removed. (default: false)') + + args = parser.parse_args(args) + hubs.use_hub(get_hub()) + if args.conf_file: + conf = readconf(args.conf_file, 'object-relinker') + if args.debug: + conf['log_level'] = 'DEBUG' + user = args.user or conf.get('user') + if user: + drop_privileges(user) + logger = get_logger(conf) + else: + level = 'DEBUG' if args.debug else 'INFO' + conf = {'log_level': level} + if args.user: + # Drop privs before creating log file + drop_privileges(args.user) + conf['user'] = args.user + logging.basicConfig( + format='%(message)s', + level=getattr(logging, level), + filename=args.logfile) + logger = SwiftLogAdapter(logging.getLogger(), server='relinker') + + conf.update({ + 'swift_dir': args.swift_dir or conf.get('swift_dir', '/etc/swift'), + 'devices': args.devices or conf.get('devices', '/srv/node'), + 'mount_check': (config_true_value(conf.get('mount_check', 'true')) + and not args.skip_mount_check), + 'files_per_second': ( + args.files_per_second if args.files_per_second is not None + else non_negative_float(conf.get('files_per_second', '0'))), + 'policies': set(args.policies) or POLICIES, + 'partitions': set(args.partitions), + 'workers': config_auto_int_value( + conf.get('workers') if args.workers is None else args.workers, + 'auto'), + 'recon_cache_path': conf.get('recon_cache_path', + DEFAULT_RECON_CACHE_PATH), + 'stats_interval': non_negative_float( + args.stats_interval or conf.get('stats_interval', + DEFAULT_STATS_INTERVAL)), + 'clobber_hardlink_collisions': ( + args.clobber_hardlink_collisions or + config_true_value(conf.get('clobber_hardlink_collisions', + 'false'))), + }) + return parallel_process( + args.action == 'cleanup', conf, logger, args.device_list) diff --git a/swift/cli/reload.py b/swift/cli/reload.py new file mode 100755 index 0000000000..9d84e39c71 --- /dev/null +++ b/swift/cli/reload.py @@ -0,0 +1,135 @@ +# Copyright (c) 2022 NVIDIA +# +# Licensed under the Apache License, Version 2.0 
(the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +""" +Safely reload WSGI servers while minimizing client downtime and errors by + + * validating that the process is a Swift WSGI server manager, + * checking that the configuration file used is valid, + * sending the "seamless reload" signal, and + * waiting for the reload to complete. +""" + +import argparse +import errno +import os +import os.path +import signal +import socket +import subprocess +import sys + +from swift.common.utils import NotificationServer + + +EXIT_BAD_PID = 2 # similar to argparse exiting 2 on an unknown arg +EXIT_RELOAD_FAILED = 1 +EXIT_RELOAD_TIMEOUT = 128 + errno.ETIMEDOUT + + +def validate_manager_pid(pid): + try: + with open('/proc/%d/cmdline' % pid, 'r') as fp: + cmd = fp.read().strip('\x00').split('\x00') + sid = os.getsid(pid) + except (IOError, OSError): + print("Failed to get process information for %s" % pid, + file=sys.stderr) + exit(EXIT_BAD_PID) + + scripts = [os.path.basename(c) for c in cmd + if '/bin/' in c and '/bin/python' not in c] + + if len(scripts) != 1 or not scripts[0].startswith("swift-"): + print("Non-swift process: %r" % ' '.join(cmd), file=sys.stderr) + exit(EXIT_BAD_PID) + + if scripts[0] not in {"swift-proxy-server", "swift-account-server", + "swift-container-server", "swift-object-server"}: + print("Process does not support config checks: %s" % scripts[0], + file=sys.stderr) + exit(EXIT_BAD_PID) + + if sid != pid: + print("Process appears to be a %s worker, not a manager. " + "Did you mean %s?" 
% (scripts[0], sid), file=sys.stderr) + exit(EXIT_BAD_PID) + + return cmd, scripts[0] + + +def main(args=None): + parser = argparse.ArgumentParser(__doc__) + parser.add_argument("pid", type=int, + help="server PID which should be reloaded") + wait_group = parser.add_mutually_exclusive_group() + wait_group.add_argument("-t", "--timeout", type=float, default=300.0, + help="max time to wait for reload to complete") + wait_group.add_argument("-w", "--no-wait", + action="store_false", dest="wait", + help="skip waiting for reload to complete") + parser.add_argument("-v", "--verbose", action="store_true", + help="display more information as the process reloads") + args = parser.parse_args(args) + + cmd, script = validate_manager_pid(args.pid) + + if args.verbose: + print("Checking config for %s" % script) + try: + subprocess.check_call(cmd + ["--test-config"]) + except subprocess.CalledProcessError: + print("Failed to validate config", file=sys.stderr) + exit(EXIT_RELOAD_FAILED) + + if args.wait: + try: + with NotificationServer(args.pid, args.timeout) as notifications: + if args.verbose: + print("Sending USR1 signal") + os.kill(args.pid, signal.SIGUSR1) + + try: + ready = False + while not ready: + data = notifications.receive() + for data in data.split(b"\n"): + if args.verbose: + if data in (b"READY=1", b"RELOADING=1", + b"STOPPING=1"): + print("Process is %s" % + data.decode("ascii")[:-2]) + else: + print("Received notification %r" % data) + + if data == b"READY=1": + ready = True + except socket.timeout: + print("Timed out reloading %s" % script, file=sys.stderr) + exit(EXIT_RELOAD_TIMEOUT) + except OSError as e: + print("Could not bind notification socket: %s" % e, + file=sys.stderr) + exit(EXIT_RELOAD_FAILED) + else: # --no-wait + if args.verbose: + print("Sending USR1 signal") + os.kill(args.pid, signal.SIGUSR1) + + print("Reloaded %s" % script) + + +if __name__ == "__main__": + main() diff --git a/swift/cli/ring_builder_analyzer.py b/swift/cli/ring_builder_analyzer.py new file mode 100644 index 0000000000..c385643389 --- /dev/null +++ b/swift/cli/ring_builder_analyzer.py @@ -0,0 +1,349 @@ +# Copyright (c) 2015 Samuel Merritt +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +""" +This is a tool for analyzing how well the ring builder performs its job +in a particular scenario. It is intended to help developers quantify any +improvements or regressions in the ring builder; it is probably not useful +to others. + +The ring builder analyzer takes a scenario file containing some initial +parameters for a ring builder plus a certain number of rounds. In each +round, some modifications are made to the builder, e.g. add a device, remove +a device, change a device's weight. Then, the builder is repeatedly +rebalanced until it settles down. Data about that round is printed, and the +next round begins. + +Scenarios are specified in JSON. 
Example scenario for a gradual device +addition:: + + { + "part_power": 12, + "replicas": 3, + "overload": 0.1, + "random_seed": 203488, + + "rounds": [ + [ + ["add", "r1z2-10.20.30.40:6200/sda", 8000], + ["add", "r1z2-10.20.30.40:6200/sdb", 8000], + ["add", "r1z2-10.20.30.40:6200/sdc", 8000], + ["add", "r1z2-10.20.30.40:6200/sdd", 8000], + + ["add", "r1z2-10.20.30.41:6200/sda", 8000], + ["add", "r1z2-10.20.30.41:6200/sdb", 8000], + ["add", "r1z2-10.20.30.41:6200/sdc", 8000], + ["add", "r1z2-10.20.30.41:6200/sdd", 8000], + + ["add", "r1z2-10.20.30.43:6200/sda", 8000], + ["add", "r1z2-10.20.30.43:6200/sdb", 8000], + ["add", "r1z2-10.20.30.43:6200/sdc", 8000], + ["add", "r1z2-10.20.30.43:6200/sdd", 8000], + + ["add", "r1z2-10.20.30.44:6200/sda", 8000], + ["add", "r1z2-10.20.30.44:6200/sdb", 8000], + ["add", "r1z2-10.20.30.44:6200/sdc", 8000] + ], [ + ["add", "r1z2-10.20.30.44:6200/sdd", 1000] + ], [ + ["set_weight", 15, 2000] + ], [ + ["remove", 3], + ["set_weight", 15, 3000] + ], [ + ["set_weight", 15, 4000] + ], [ + ["set_weight", 15, 5000] + ], [ + ["set_weight", 15, 6000] + ], [ + ["set_weight", 15, 7000] + ], [ + ["set_weight", 15, 8000] + ]] + } + +""" + +import argparse +import json +import sys + +from swift.common.ring import builder +from swift.common.ring.utils import parse_add_value + + +ARG_PARSER = argparse.ArgumentParser( + description='Put the ring builder through its paces') +ARG_PARSER.add_argument( + '--check', '-c', action='store_true', + help="Just check the scenario, don't execute it.") +ARG_PARSER.add_argument( + 'scenario_path', + help="Path to the scenario file") + + +class ParseCommandError(ValueError): + + def __init__(self, name, round_index, command_index, msg): + msg = "Invalid %s (round %s, command %s): %s" % ( + name, round_index, command_index, msg) + super(ParseCommandError, self).__init__(msg) + + +def _parse_weight(round_index, command_index, weight_str): + try: + weight = float(weight_str) + except ValueError as err: + raise ParseCommandError('weight', round_index, command_index, err) + if weight < 0: + raise ParseCommandError('weight', round_index, command_index, + 'cannot be negative') + return weight + + +def _parse_add_command(round_index, command_index, command): + if len(command) != 3: + raise ParseCommandError( + 'add command', round_index, command_index, + 'expected array of length 3, but got %r' % command) + + dev_str = command[1] + weight_str = command[2] + + try: + dev = parse_add_value(dev_str) + except ValueError as err: + raise ParseCommandError('device specifier', round_index, + command_index, err) + + dev['weight'] = _parse_weight(round_index, command_index, weight_str) + + if dev['region'] is None: + dev['region'] = 1 + + default_key_map = { + 'replication_ip': 'ip', + 'replication_port': 'port', + } + for empty_key, default_key in default_key_map.items(): + if dev[empty_key] is None: + dev[empty_key] = dev[default_key] + + return ['add', dev] + + +def _parse_remove_command(round_index, command_index, command): + if len(command) != 2: + raise ParseCommandError('remove commnd', round_index, command_index, + "expected array of length 2, but got %r" % + (command,)) + + dev_str = command[1] + + try: + dev_id = int(dev_str) + except ValueError as err: + raise ParseCommandError('device ID in remove', + round_index, command_index, err) + + return ['remove', dev_id] + + +def _parse_set_weight_command(round_index, command_index, command): + if len(command) != 3: + raise ParseCommandError('remove command', round_index, command_index, + "expected 
array of length 3, but got %r" % + (command,)) + + dev_str = command[1] + weight_str = command[2] + + try: + dev_id = int(dev_str) + except ValueError as err: + raise ParseCommandError('device ID in set_weight', + round_index, command_index, err) + + weight = _parse_weight(round_index, command_index, weight_str) + return ['set_weight', dev_id, weight] + + +def _parse_save_command(round_index, command_index, command): + if len(command) != 2: + raise ParseCommandError( + command, round_index, command_index, + "expected array of length 2 but got %r" % (command,)) + return ['save', command[1]] + + +def parse_scenario(scenario_data): + """ + Takes a serialized scenario and turns it into a data structure suitable + for feeding to run_scenario(). + + :returns: scenario + :raises ValueError: on invalid scenario + """ + + parsed_scenario = {} + + try: + raw_scenario = json.loads(scenario_data) + except ValueError as err: + raise ValueError("Invalid JSON in scenario file: %s" % err) + + if not isinstance(raw_scenario, dict): + raise ValueError("Scenario must be a JSON object, not array or string") + + if 'part_power' not in raw_scenario: + raise ValueError("part_power missing") + try: + parsed_scenario['part_power'] = int(raw_scenario['part_power']) + except ValueError as err: + raise ValueError("part_power not an integer: %s" % err) + if not 1 <= parsed_scenario['part_power'] <= 32: + raise ValueError("part_power must be between 1 and 32, but was %d" + % raw_scenario['part_power']) + + if 'replicas' not in raw_scenario: + raise ValueError("replicas missing") + try: + parsed_scenario['replicas'] = float(raw_scenario['replicas']) + except ValueError as err: + raise ValueError("replicas not a float: %s" % err) + if parsed_scenario['replicas'] < 1: + raise ValueError("replicas must be at least 1, but is %f" + % parsed_scenario['replicas']) + + if 'overload' not in raw_scenario: + raise ValueError("overload missing") + try: + parsed_scenario['overload'] = float(raw_scenario['overload']) + except ValueError as err: + raise ValueError("overload not a float: %s" % err) + if parsed_scenario['overload'] < 0: + raise ValueError("overload must be non-negative, but is %f" + % parsed_scenario['overload']) + + if 'random_seed' not in raw_scenario: + raise ValueError("random_seed missing") + try: + parsed_scenario['random_seed'] = int(raw_scenario['random_seed']) + except ValueError as err: + raise ValueError("replicas not an integer: %s" % err) + + if 'rounds' not in raw_scenario: + raise ValueError("rounds missing") + if not isinstance(raw_scenario['rounds'], list): + raise ValueError("rounds must be an array") + + parser_for_command = { + 'add': _parse_add_command, + 'remove': _parse_remove_command, + 'set_weight': _parse_set_weight_command, + 'save': _parse_save_command, + } + + parsed_scenario['rounds'] = [] + for round_index, raw_round in enumerate(raw_scenario['rounds']): + if not isinstance(raw_round, list): + raise ValueError("round %d not an array" % round_index) + + parsed_round = [] + for command_index, command in enumerate(raw_round): + if command[0] not in parser_for_command: + raise ValueError( + "Unknown command (round %d, command %d): " + "'%s' should be one of %s" % + (round_index, command_index, command[0], + parser_for_command.keys())) + parsed_round.append( + parser_for_command[command[0]]( + round_index, command_index, command)) + parsed_scenario['rounds'].append(parsed_round) + return parsed_scenario + + +def run_scenario(scenario): + """ + Takes a parsed scenario (like from 
parse_scenario()) and runs it. + """ + seed = scenario['random_seed'] + + rb = builder.RingBuilder(scenario['part_power'], scenario['replicas'], 1) + rb.set_overload(scenario['overload']) + + command_map = { + 'add': rb.add_dev, + 'remove': rb.remove_dev, + 'set_weight': rb.set_dev_weight, + 'save': rb.save, + } + + for round_index, commands in enumerate(scenario['rounds']): + print("Round %d" % (round_index + 1)) + + for command in commands: + key = command.pop(0) + try: + command_f = command_map[key] + except KeyError: + raise ValueError("unknown command %r" % key) + command_f(*command) + + rebalance_number = 1 + parts_moved, old_balance, removed_devs = rb.rebalance(seed=seed) + rb.pretend_min_part_hours_passed() + print("\tRebalance 1: moved %d parts, balance is %.6f, %d removed " + "devs" % (parts_moved, old_balance, removed_devs)) + + while True: + rebalance_number += 1 + parts_moved, new_balance, removed_devs = rb.rebalance(seed=seed) + rb.pretend_min_part_hours_passed() + print("\tRebalance %d: moved %d parts, balance is %.6f, " + "%d removed devs" % (rebalance_number, parts_moved, + new_balance, removed_devs)) + if parts_moved == 0 and removed_devs == 0: + break + if abs(new_balance - old_balance) < 1 and not ( + old_balance == builder.MAX_BALANCE and + new_balance == builder.MAX_BALANCE): + break + old_balance = new_balance + + +def main(argv=None): + args = ARG_PARSER.parse_args(argv) + + try: + with open(args.scenario_path) as sfh: + scenario_data = sfh.read() + except OSError as err: + sys.stderr.write("Error opening scenario %s: %s\n" % + (args.scenario_path, err)) + return 1 + + try: + scenario = parse_scenario(scenario_data) + except ValueError as err: + sys.stderr.write("Invalid scenario %s: %s\n" % + (args.scenario_path, err)) + return 1 + + if not args.check: + run_scenario(scenario) + return 0 diff --git a/swift/cli/ringbuilder.py b/swift/cli/ringbuilder.py new file mode 100644 index 0000000000..2f609ad018 --- /dev/null +++ b/swift/cli/ringbuilder.py @@ -0,0 +1,1779 @@ +# Copyright (c) 2010-2012 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
+ +import logging + +from collections import defaultdict +from errno import EEXIST +from itertools import islice +from operator import itemgetter +from os import mkdir +from os.path import basename, abspath, dirname, exists, join as pathjoin +import sys +from sys import argv as sys_argv, exit, stdout +from textwrap import wrap +from time import time +import traceback +from datetime import timedelta +import optparse +import math + +from swift.common import exceptions +from swift.common.ring import RingBuilder, Ring, RingData +from swift.common.ring.builder import MAX_BALANCE +from swift.common.ring.composite_builder import CompositeRingBuilder +from swift.common.ring.ring import RING_CODECS, DEFAULT_RING_FORMAT_VERSION +from swift.common.ring.utils import validate_args, \ + validate_and_normalize_ip, build_dev_from_opts, \ + parse_builder_ring_filename_args, parse_search_value, \ + parse_search_values_from_opts, parse_change_values_from_opts, \ + dispersion_report, parse_add_value +from swift.common.utils import lock_parent_directory, is_valid_ipv6 + +MAJOR_VERSION = 1 +MINOR_VERSION = 3 +EXIT_SUCCESS = 0 +EXIT_WARNING = 1 +EXIT_ERROR = 2 + +FORMAT_CHOICES = [str(v) for v in RING_CODECS] + +global argv, backup_dir, builder, builder_file, ring_file +argv = backup_dir = builder = builder_file = ring_file = None + + +def format_device(dev): + """ + Format a device for display. + """ + copy_dev = dev.copy() + for key in ('ip', 'replication_ip'): + if ':' in copy_dev[key]: + copy_dev[key] = '[' + copy_dev[key] + ']' + return ('d%(id)sr%(region)sz%(zone)s-%(ip)s:%(port)sR' + '%(replication_ip)s:%(replication_port)s/%(device)s_' + '"%(meta)s"' % copy_dev) + + +def _parse_search_values(argvish): + + new_cmd_format, opts, args = validate_args(argvish) + + # We'll either parse the all-in-one-string format or the + # --options format, + # but not both. If both are specified, raise an error. + try: + search_values = {} + if len(args) > 0: + if new_cmd_format or len(args) != 1: + print(Commands.search.__doc__.strip()) + exit(EXIT_ERROR) + search_values = parse_search_value(args[0]) + else: + search_values = parse_search_values_from_opts(opts) + return search_values + except ValueError as e: + print(e) + exit(EXIT_ERROR) + + +def _find_parts(devs): + devs = [d['id'] for d in devs] + if not devs or not builder._replica2part2dev: + return None + + partition_count = {} + for replica in builder._replica2part2dev: + for partition, device in enumerate(replica): + if device in devs: + if partition not in partition_count: + partition_count[partition] = 0 + partition_count[partition] += 1 + + # Sort by number of found replicas to keep the output format + sorted_partition_count = sorted( + partition_count.items(), key=itemgetter(1), reverse=True) + + return sorted_partition_count + + +def _parse_list_parts_values(argvish): + + new_cmd_format, opts, args = validate_args(argvish) + + # We'll either parse the all-in-one-string format or the + # --options format, + # but not both. If both are specified, raise an error. + try: + devs = [] + if len(args) > 0: + if new_cmd_format: + print(Commands.list_parts.__doc__.strip()) + exit(EXIT_ERROR) + + for arg in args: + devs.extend( + builder.search_devs(parse_search_value(arg)) or []) + else: + devs.extend(builder.search_devs( + parse_search_values_from_opts(opts)) or []) + + return devs + except ValueError as e: + print(e) + exit(EXIT_ERROR) + + +def _parse_add_values(argvish): + """ + Parse devices to add as specified on the command line. 
+ + Will exit on error and spew warnings. + + :returns: array of device dicts + """ + new_cmd_format, opts, args = validate_args(argvish) + + # We'll either parse the all-in-one-string format or the + # --options format, + # but not both. If both are specified, raise an error. + parsed_devs = [] + if len(args) > 0: + if new_cmd_format or len(args) % 2 != 0: + print(Commands.add.__doc__.strip()) + exit(EXIT_ERROR) + + devs_and_weights = zip(islice(args, 0, len(args), 2), + islice(args, 1, len(args), 2)) + + for devstr, weightstr in devs_and_weights: + dev_dict = parse_add_value(devstr) + + if dev_dict['region'] is None: + print('WARNING: No region specified for %s. ' + 'Defaulting to region 1.\n' % devstr, file=sys.stderr) + dev_dict['region'] = 1 + + if dev_dict['replication_ip'] is None: + dev_dict['replication_ip'] = dev_dict['ip'] + + if dev_dict['replication_port'] is None: + dev_dict['replication_port'] = dev_dict['port'] + + weight = float(weightstr) + if weight < 0: + raise ValueError('Invalid weight value: %s' % devstr) + dev_dict['weight'] = weight + + parsed_devs.append(dev_dict) + else: + parsed_devs.append(build_dev_from_opts(opts)) + + return parsed_devs + + +def check_devs(devs, input_question, opts, abort_msg): + + if not devs: + print('Search value matched 0 devices.\n' + 'The on-disk ring builder is unchanged.') + exit(EXIT_ERROR) + + if len(devs) > 1: + print('Matched more than one device:') + for dev in devs: + print(' %s' % format_device(dev)) + try: + abort = not opts.yes and input(input_question) != 'y' + except (EOFError, KeyboardInterrupt): + abort = True + if abort: + print(abort_msg) + exit(EXIT_ERROR) + + +def _set_weight_values(devs, weight, opts): + + input_question = 'Are you sure you want to update the weight for these ' \ + '%s devices? (y/N) ' % len(devs) + abort_msg = 'Aborting device modifications' + check_devs(devs, input_question, opts, abort_msg) + + for dev in devs: + builder.set_dev_weight(dev['id'], weight) + print('%s weight set to %s' % (format_device(dev), + dev['weight'])) + + +def _set_region_values(devs, region, opts): + + input_question = 'Are you sure you want to update the region for these ' \ + '%s devices? (y/N) ' % len(devs) + abort_msg = 'Aborting device modifications' + check_devs(devs, input_question, opts, abort_msg) + + for dev in devs: + builder.set_dev_region(dev['id'], region) + print('%s region set to %s' % (format_device(dev), + dev['region'])) + + +def _set_zone_values(devs, zone, opts): + + input_question = 'Are you sure you want to update the zone for these ' \ + '%s devices? (y/N) ' % len(devs) + abort_msg = 'Aborting device modifications' + check_devs(devs, input_question, opts, abort_msg) + + for dev in devs: + builder.set_dev_zone(dev['id'], zone) + print('%s zone set to %s' % (format_device(dev), + dev['zone'])) + + +def _parse_set_weight_values(argvish): + + new_cmd_format, opts, args = validate_args(argvish) + + # We'll either parse the all-in-one-string format or the + # --options format, + # but not both. If both are specified, raise an error. 
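    # Old-style usage pairs each <search-value> with a new <weight>;
    # new-style passes the search terms as --options plus a single
    # weight argument.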
+ try: + if not new_cmd_format: + if len(args) % 2 != 0: + print(Commands.set_weight.__doc__.strip()) + exit(EXIT_ERROR) + + devs_and_weights = zip(islice(argvish, 0, len(argvish), 2), + islice(argvish, 1, len(argvish), 2)) + for devstr, weightstr in devs_and_weights: + devs = (builder.search_devs( + parse_search_value(devstr)) or []) + weight = float(weightstr) + _set_weight_values(devs, weight, opts) + else: + if len(args) != 1: + print(Commands.set_weight.__doc__.strip()) + exit(EXIT_ERROR) + + devs = (builder.search_devs( + parse_search_values_from_opts(opts)) or []) + weight = float(args[0]) + _set_weight_values(devs, weight, opts) + except ValueError as e: + print(e) + exit(EXIT_ERROR) + + +def _set_info_values(devs, change, opts): + + input_question = 'Are you sure you want to update the info for these ' \ + '%s devices? (y/N) ' % len(devs) + abort_msg = 'Aborting device modifications' + check_devs(devs, input_question, opts, abort_msg) + + for dev in devs: + orig_dev_string = format_device(dev) + test_dev = dict(dev) + for key in change: + test_dev[key] = change[key] + for check_dev in builder.devs: + if not check_dev or check_dev['id'] == test_dev['id']: + continue + if check_dev['ip'] == test_dev['ip'] and \ + check_dev['port'] == test_dev['port'] and \ + check_dev['device'] == test_dev['device']: + print('Device %d already uses %s:%d/%s.' % + (check_dev['id'], check_dev['ip'], + check_dev['port'], check_dev['device'])) + exit(EXIT_ERROR) + for key in change: + dev[key] = change[key] + print('Device %s is now %s' % (orig_dev_string, + format_device(dev))) + + +def calculate_change_value(change_value, change, v_name, v_name_port): + ip = '' + if change_value and change_value[0].isdigit(): + i = 1 + while (i < len(change_value) and + change_value[i] in '0123456789.'): + i += 1 + ip = change_value[:i] + change_value = change_value[i:] + elif change_value and change_value.startswith('['): + i = 1 + while i < len(change_value) and change_value[i] != ']': + i += 1 + i += 1 + ip = change_value[:i].lstrip('[').rstrip(']') + change_value = change_value[i:] + if ip: + change[v_name] = validate_and_normalize_ip(ip) + if change_value.startswith(':'): + i = 1 + while i < len(change_value) and change_value[i].isdigit(): + i += 1 + change[v_name_port] = int(change_value[1:i]) + change_value = change_value[i:] + return change_value + + +def _parse_set_region_values(argvish): + + new_cmd_format, opts, args = validate_args(argvish) + + # We'll either parse the all-in-one-string format or the + # --options format, + # but not both. If both are specified, raise an error. + try: + devs = [] + if not new_cmd_format: + if len(args) % 2 != 0: + print(Commands.set_region.__doc__.strip()) + exit(EXIT_ERROR) + + devs_and_regions = zip(islice(argvish, 0, len(argvish), 2), + islice(argvish, 1, len(argvish), 2)) + for devstr, regionstr in devs_and_regions: + devs.extend(builder.search_devs( + parse_search_value(devstr)) or []) + region = int(regionstr) + _set_region_values(devs, region, opts) + else: + if len(args) != 1: + print(Commands.set_region.__doc__.strip()) + exit(EXIT_ERROR) + + devs.extend(builder.search_devs( + parse_search_values_from_opts(opts)) or []) + region = int(args[0]) + _set_region_values(devs, region, opts) + except ValueError as e: + print(e) + exit(EXIT_ERROR) + + +def _parse_set_zone_values(argvish): + + new_cmd_format, opts, args = validate_args(argvish) + + # We'll either parse the all-in-one-string format or the + # --options format, + # but not both. 
If both are specified, raise an error. + try: + devs = [] + if not new_cmd_format: + if len(args) % 2 != 0: + print(Commands.set_zone.__doc__.strip()) + exit(EXIT_ERROR) + + devs_and_zones = zip(islice(argvish, 0, len(argvish), 2), + islice(argvish, 1, len(argvish), 2)) + for devstr, zonestr in devs_and_zones: + devs.extend(builder.search_devs( + parse_search_value(devstr)) or []) + zone = int(zonestr) + _set_zone_values(devs, zone, opts) + else: + if len(args) != 1: + print(Commands.set_zone.__doc__.strip()) + exit(EXIT_ERROR) + + devs.extend(builder.search_devs( + parse_search_values_from_opts(opts)) or []) + zone = int(args[0]) + _set_zone_values(devs, zone, opts) + except ValueError as e: + print(e) + exit(EXIT_ERROR) + + +def _parse_set_info_values(argvish): + + new_cmd_format, opts, args = validate_args(argvish) + + # We'll either parse the all-in-one-string format or the + # --options format, + # but not both. If both are specified, raise an error. + if not new_cmd_format: + if len(args) % 2 != 0: + print(Commands.search.__doc__.strip()) + exit(EXIT_ERROR) + + searches_and_changes = zip(islice(argvish, 0, len(argvish), 2), + islice(argvish, 1, len(argvish), 2)) + + for search_value, change_value in searches_and_changes: + devs = builder.search_devs(parse_search_value(search_value)) + change = {} + + change_value = calculate_change_value(change_value, change, + 'ip', 'port') + + if change_value.startswith('R'): + change_value = change_value[1:] + change_value = calculate_change_value(change_value, change, + 'replication_ip', + 'replication_port') + if change_value.startswith('/'): + i = 1 + while i < len(change_value) and change_value[i] != '_': + i += 1 + change['device'] = change_value[1:i] + change_value = change_value[i:] + if change_value.startswith('_'): + change['meta'] = change_value[1:] + change_value = '' + if change_value or not change: + raise ValueError('Invalid set info change value: %s' % + repr(argvish[1])) + _set_info_values(devs, change, opts) + else: + devs = builder.search_devs(parse_search_values_from_opts(opts)) + change = parse_change_values_from_opts(opts) + _set_info_values(devs, change, opts) + + +def _parse_remove_values(argvish): + + new_cmd_format, opts, args = validate_args(argvish) + + # We'll either parse the all-in-one-string format or the + # --options format, + # but not both. If both are specified, raise an error. 
+ try: + devs = [] + if len(args) > 0: + if new_cmd_format: + print(Commands.remove.__doc__.strip()) + exit(EXIT_ERROR) + + for arg in args: + devs.extend(builder.search_devs( + parse_search_value(arg)) or []) + else: + devs.extend(builder.search_devs( + parse_search_values_from_opts(opts))) + + return (devs, opts) + except ValueError as e: + print(e) + exit(EXIT_ERROR) + + +def _make_display_device_table(builder): + ip_width = 10 + port_width = 4 + rep_ip_width = 14 + rep_port_width = 4 + ip_ipv6 = rep_ipv6 = False + weight_width = 6 + for dev in builder._iter_devs(): + if is_valid_ipv6(dev['ip']): + ip_ipv6 = True + if is_valid_ipv6(dev['replication_ip']): + rep_ipv6 = True + ip_width = max(len(dev['ip']), ip_width) + rep_ip_width = max(len(dev['replication_ip']), rep_ip_width) + port_width = max(len(str(dev['port'])), port_width) + rep_port_width = max(len(str(dev['replication_port'])), + rep_port_width) + weight_width = max(len('%6.02f' % dev['weight']), + weight_width) + if ip_ipv6: + ip_width += 2 + if rep_ipv6: + rep_ip_width += 2 + header_line = ('Devices:%5s %6s %4s %' + str(ip_width) + + 's:%-' + str(port_width) + 's %' + + str(rep_ip_width) + 's:%-' + str(rep_port_width) + + 's %5s %' + str(weight_width) + 's %10s %7s %5s %s') % ( + 'id', 'region', 'zone', 'ip address', + 'port', 'replication ip', 'port', 'name', + 'weight', 'partitions', 'balance', 'flags', + 'meta') + + def print_dev_f(dev, balance_per_dev=0.00, flags=''): + def get_formated_ip(key): + value = dev[key] + if ':' in value: + value = '[%s]' % value + return value + dev_ip = get_formated_ip('ip') + dev_replication_ip = get_formated_ip('replication_ip') + format_string = ''.join(['%13d %6d %4d ', + '%', str(ip_width), 's:%-', + str(port_width), 'd ', '%', + str(rep_ip_width), 's', ':%-', + str(rep_port_width), 'd %5s %', + str(weight_width), '.02f' + ' %10s %7.02f %5s %s']) + args = (dev['id'], dev['region'], dev['zone'], dev_ip, dev['port'], + dev_replication_ip, dev['replication_port'], dev['device'], + dev['weight'], dev['parts'], balance_per_dev, flags, + dev['meta']) + print(format_string % args) + + return header_line, print_dev_f + + +class Commands(object): + @staticmethod + def unknown(): + print('Unknown command: %s' % argv[2]) + exit(EXIT_ERROR) + + @staticmethod + def create(): + """ +swift-ring-builder create + + Creates with 2^ partitions and . + is number of hours to restrict moving a partition more + than once. + """ + if len(argv) < 6: + print(Commands.create.__doc__.strip()) + exit(EXIT_ERROR) + try: + builder = RingBuilder(int(argv[3]), float(argv[4]), int(argv[5])) + except ValueError as e: + print(e) + exit(EXIT_ERROR) + backup_dir = pathjoin(dirname(builder_file), 'backups') + try: + mkdir(backup_dir) + except OSError as err: + if err.errno != EEXIST: + raise + builder.save(pathjoin(backup_dir, + '%d.' % time() + basename(builder_file))) + builder.save(builder_file) + exit(EXIT_SUCCESS) + + @staticmethod + def default(): + """ +swift-ring-builder + Shows information about the ring and the devices within. Output + includes a table that describes the report parameters (id, region, + port, flags, etc). + flags: possible values are 'DEL' and '' + DEL - indicates that the device is marked for removal from + ring and will be removed in next rebalance. 
+ """ + try: + builder_id = builder.id + except AttributeError: + builder_id = "(not assigned)" + print('%s, build version %d, id %s' % + (builder_file, builder.version, builder_id)) + balance = 0 + ring_empty_error = None + regions = len(set(d['region'] for d in builder.devs + if d is not None)) + zones = len(set((d['region'], d['zone']) for d in builder.devs + if d is not None)) + dev_count = len([dev for dev in builder.devs + if dev is not None]) + try: + balance = builder.get_balance() + except exceptions.EmptyRingError as e: + ring_empty_error = str(e) + dispersion_trailer = '' if builder.dispersion is None else ( + ', %.02f dispersion' % (builder.dispersion)) + print('%d partitions, %.6f replicas, %d regions, %d zones, ' + '%d devices, %d-byte IDs, %.02f balance%s' % ( + builder.parts, builder.replicas, regions, zones, dev_count, + builder.dev_id_bytes, balance, dispersion_trailer)) + print('The minimum number of hours before a partition can be ' + 'reassigned is %s (%s remaining)' % ( + builder.min_part_hours, + timedelta(seconds=builder.min_part_seconds_left))) + print('The overload factor is %0.2f%% (%.6f)' % ( + builder.overload * 100, builder.overload)) + + ring_dict = None + builder_dict = builder.get_ring().to_dict() + + # compare ring file against builder file + if not exists(ring_file): + print('Ring file %s not found, ' + 'probably it hasn\'t been written yet' % ring_file) + else: + try: + ring_dict = RingData.load(ring_file).to_dict() + except Exception as exc: + print('Ring file %s is invalid: %r' % (ring_file, exc)) + else: + # mostly just an implementation detail + builder_dict.pop('dev_id_bytes', None) + ring_dict.pop('dev_id_bytes', None) + if builder_dict == ring_dict: + print('Ring file %s is up-to-date' % ring_file) + else: + print('Ring file %s is obsolete' % ring_file) + + if ring_empty_error: + balance_per_dev = defaultdict(int) + else: + balance_per_dev = builder._build_balance_per_dev() + header_line, print_dev_f = _make_display_device_table(builder) + print(header_line) + for dev in sorted( + builder._iter_devs(), + key=lambda x: (x['region'], x['zone'], x['ip'], x['device']) + ): + flags = 'DEL' if dev in builder._remove_devs else '' + print_dev_f(dev, balance_per_dev[dev['id']], flags) + + # Print some helpful info if partition power increase in progress + if (builder.next_part_power and + builder.next_part_power == (builder.part_power + 1)): + print('\nPreparing increase of partition power (%d -> %d)' % ( + builder.part_power, builder.next_part_power)) + print('Run "swift-object-relinker relink" on all nodes before ' + 'moving on to increase_partition_power.') + if (builder.next_part_power and + builder.part_power == builder.next_part_power): + print('\nIncreased partition power (%d -> %d)' % ( + builder.part_power, builder.next_part_power)) + if builder_dict != ring_dict: + print('First run "swift-ring-builder write_ring"' + ' now and copy the updated .ring.gz file to all nodes.') + print('Run "swift-object-relinker cleanup" on all nodes before ' + 'moving on to finish_increase_partition_power.') + + if ring_empty_error: + print(ring_empty_error) + exit(EXIT_SUCCESS) + + @staticmethod + def version(): + """ +swift-ring-builder version + """ + if len(argv) < 3: + print(Commands.create.__doc__.strip()) + exit(EXIT_ERROR) + try: + rd = RingData.load(ring_file, metadata_only=True) + except ValueError as e: + print(e) + exit(EXIT_ERROR) + print('%s: Serialization version: %d (%d-byte IDs), ' + 'build version: %d' % + (ring_file, rd.format_version, 
rd.dev_id_bytes, rd.version)) + exit(EXIT_SUCCESS) + + @staticmethod + def search(): + """ +swift-ring-builder search + +or + +swift-ring-builder search + --region --zone --ip --port + --replication-ip --replication-port + --device --meta --weight + + Where , and are replication ip, hostname + and port. + Any of the options are optional in both cases. + + Shows information about matching devices. + """ + if len(argv) < 4: + print(Commands.search.__doc__.strip()) + print() + print(parse_search_value.__doc__.strip()) + exit(EXIT_ERROR) + + devs = builder.search_devs(_parse_search_values(argv[3:])) + + if not devs: + print('No matching devices found') + exit(EXIT_ERROR) + print('Devices: id region zone ip address port ' + 'replication ip replication port name weight partitions ' + 'balance meta') + weighted_parts = builder.parts * builder.replicas / \ + sum(d['weight'] for d in builder.devs if d is not None) + for dev in devs: + if not dev['weight']: + if dev['parts']: + balance = MAX_BALANCE + else: + balance = 0 + else: + balance = 100.0 * dev['parts'] / \ + (dev['weight'] * weighted_parts) - 100.0 + print(' %5d %7d %5d %15s %5d %15s %17d %9s %6.02f %10s ' + '%7.02f %s' % + (dev['id'], dev['region'], dev['zone'], dev['ip'], + dev['port'], dev['replication_ip'], dev['replication_port'], + dev['device'], dev['weight'], dev['parts'], balance, + dev['meta'])) + exit(EXIT_SUCCESS) + + @staticmethod + def list_parts(): + """ +swift-ring-builder list_parts [] .. + +or + +swift-ring-builder list_parts + --region --zone --ip --port + --replication-ip --replication-port + --device --meta --weight + + Where , and are replication ip, hostname + and port. + Any of the options are optional in both cases. + + Returns a 2 column list of all the partitions that are assigned to any of + the devices matching the search values given. The first column is the + assigned partition number and the second column is the number of device + matches for that partition. The list is ordered from most number of matches + to least. If there are a lot of devices to match against, this command + could take a while to run. + """ + if len(argv) < 4: + print(Commands.list_parts.__doc__.strip()) + print() + print(parse_search_value.__doc__.strip()) + exit(EXIT_ERROR) + + if not builder._replica2part2dev: + print('Specified builder file \"%s\" is not rebalanced yet. ' + 'Please rebalance first.' % builder_file) + exit(EXIT_ERROR) + + devs = _parse_list_parts_values(argv[3:]) + if not devs: + print('No matching devices found') + exit(EXIT_ERROR) + + sorted_partition_count = _find_parts(devs) + + if not sorted_partition_count: + print('No matching devices found') + exit(EXIT_ERROR) + + print('Partition Matches') + for partition, count in sorted_partition_count: + print('%9d %7d' % (partition, count)) + exit(EXIT_SUCCESS) + + @staticmethod + def add(): + """ +swift-ring-builder add + [r]z-:[R:]/_ + + [[r]z-:[R:]/_ + ] ... + + Where and are replication ip and port. + +or + +swift-ring-builder add + --region --zone --ip --port + [--replication-ip ] [--replication-port ] + --device --weight + [--meta ] + + Adds devices to the ring with the given information. No partitions will be + assigned to the new device until after running 'rebalance'. This is so you + can make multiple device changes and rebalance them all just once. + """ + if len(argv) < 5: + print(Commands.add.__doc__.strip()) + exit(EXIT_ERROR) + + if builder.next_part_power: + print('Partition power increase in progress. 
You need ') + print('to finish the increase first before adding devices.') + exit(EXIT_ERROR) + + try: + for new_dev in _parse_add_values(argv[3:]): + for dev in builder.devs: + if dev is None: + continue + if dev['ip'] == new_dev['ip'] and \ + dev['port'] == new_dev['port'] and \ + dev['device'] == new_dev['device']: + print('Device %d already uses %s:%d/%s.' % + (dev['id'], dev['ip'], + dev['port'], dev['device'])) + print("The on-disk ring builder is unchanged.\n") + exit(EXIT_ERROR) + dev_id = builder.add_dev(new_dev) + print('Device %s with %s weight got id %s' % + (format_device(new_dev), new_dev['weight'], dev_id)) + except ValueError as err: + print(err) + print('The on-disk ring builder is unchanged.') + exit(EXIT_ERROR) + + builder.save(builder_file) + exit(EXIT_SUCCESS) + + @staticmethod + def set_weight(): + """ +swift-ring-builder set_weight + [ ] ... + [--yes] + +or + +swift-ring-builder set_weight + --region --zone --ip --port + --replication-ip --replication-port + --device --meta --weight + [--yes] + + Where , and are replication ip, hostname + and port. and are the search weight and new + weight values respectively. + Any of the options are optional in both cases. + + Resets the devices' weights. No partitions will be reassigned to or from + the device until after running 'rebalance'. This is so you can make + multiple device changes and rebalance them all just once. + + Option --yes assume a yes response to all questions. + """ + # if len(argv) < 5 or len(argv) % 2 != 1: + if len(argv) < 5: + print(Commands.set_weight.__doc__.strip()) + print() + print(parse_search_value.__doc__.strip()) + exit(EXIT_ERROR) + + _parse_set_weight_values(argv[3:]) + + builder.save(builder_file) + exit(EXIT_SUCCESS) + + @staticmethod + def set_region(): + """ +swift-ring-builder set_region + [ set_region + --region --zone --ip --port + --replication-ip --replication-port + --device --meta [--yes] + + Where , and are replication ip, hostname + and port. + Any of the options are optional in both cases. + + Resets the devices' regions. No partitions will be reassigned to or from + the device until after running 'rebalance'. This is so you can make + multiple device changes and rebalance them all just once. + + Option --yes assume a yes response to all questions. + """ + if len(argv) < 5: + print(Commands.set_region.__doc__.strip()) + print() + print(parse_search_value.__doc__.strip()) + exit(EXIT_ERROR) + + _parse_set_region_values(argv[3:]) + + builder.save(builder_file) + exit(EXIT_SUCCESS) + + @staticmethod + def set_zone(): + """ +swift-ring-builder set_zone + [ set_zone + --region --zone --ip --port + --replication-ip --replication-port + --device --meta [--yes] + + Where , and are replication ip, hostname + and port. + Any of the options are optional in both cases. + + Resets the devices' zones. No partitions will be reassigned to or from + the device until after running 'rebalance'. This is so you can make + multiple device changes and rebalance them all just once. + + Option --yes assume a yes response to all questions. + """ + # if len(argv) < 5 or len(argv) % 2 != 1: + if len(argv) < 5: + print(Commands.set_zone.__doc__.strip()) + print() + print(parse_search_value.__doc__.strip()) + exit(EXIT_ERROR) + + _parse_set_zone_values(argv[3:]) + + builder.save(builder_file) + exit(EXIT_SUCCESS) + + @staticmethod + def set_info(): + """ +swift-ring-builder set_info + :[R:]/_ + [ :[R:]/_] ... 
+ [--yes] + +or + +swift-ring-builder set_info + --ip --port + --replication-ip --replication-port + --device --meta + --change-ip --change-port + --change-replication-ip + --change-replication-port + --change-device + --change-meta + [--yes] + + Where , and are replication ip, hostname + and port. + Any of the options are optional in both cases. + + For each search-value, resets the matched device's information. + This information isn't used to assign partitions, so you can use + 'write_ring' afterward to rewrite the current ring with the newer + device information. Any of the parts are optional in the final + :/_ parameter; just give what you + want to change. For instance set_info d74 _"snet: 5.6.7.8" would + just update the meta data for device id 74. + + Option --yes assume a yes response to all questions. + """ + if len(argv) < 5: + print(Commands.set_info.__doc__.strip()) + print() + print(parse_search_value.__doc__.strip()) + exit(EXIT_ERROR) + + try: + _parse_set_info_values(argv[3:]) + except ValueError as err: + print(err) + exit(EXIT_ERROR) + + builder.save(builder_file) + exit(EXIT_SUCCESS) + + @staticmethod + def remove(): + """ +swift-ring-builder remove [search-value ...] + [--yes] + +or + +swift-ring-builder remove + --region --zone --ip --port + --replication-ip --replication-port + --device --meta --weight + [--yes] + + Where , and are replication ip, hostname + and port. + Any of the options are optional in both cases. + + Removes the device(s) from the ring. This should normally just be used for + a device that has failed. For a device you wish to decommission, it's best + to set its weight to 0, wait for it to drain all its data, then use this + remove command. This will not take effect until after running 'rebalance'. + This is so you can make multiple device changes and rebalance them all just + once. + + Option --yes assume a yes response to all questions. + """ + if len(argv) < 4: + print(Commands.remove.__doc__.strip()) + print() + print(parse_search_value.__doc__.strip()) + exit(EXIT_ERROR) + + if builder.next_part_power: + print('Partition power increase in progress. You need ') + print('to finish the increase first before removing devices.') + exit(EXIT_ERROR) + + devs, opts = _parse_remove_values(argv[3:]) + + input_question = 'Are you sure you want to remove these ' \ + '%s devices? (y/N) ' % len(devs) + abort_msg = 'Aborting device removals' + check_devs(devs, input_question, opts, abort_msg) + + for dev in devs: + try: + builder.remove_dev(dev['id']) + except exceptions.RingBuilderError as e: + print('-' * 79) + print( + 'An error occurred while removing device with id %d\n' + 'This usually means that you attempted to remove\n' + 'the last device in a ring. If this is the case,\n' + 'consider creating a new ring instead.\n' + 'The on-disk ring builder is unchanged.\n' + 'Original exception message: %s' % + (dev['id'], e)) + print('-' * 79) + exit(EXIT_ERROR) + + print('%s marked for removal and will ' + 'be removed next rebalance.' % format_device(dev)) + builder.save(builder_file) + exit(EXIT_SUCCESS) + + @staticmethod + def rebalance(): + """ +swift-ring-builder rebalance [options] + Attempts to rebalance the ring by reassigning partitions that haven't been + recently reassigned. 
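A rough sketch of the same flow through the RingBuilder API, mirroring the implementation that follows (file names are hypothetical; error handling and the seed and format-version options are omitted):

    # sketch only: load a builder, rebalance it and write out the ring
    from swift.common.ring import RingBuilder

    builder = RingBuilder.load('object.builder')
    parts, balance, removed_devs = builder.rebalance()
    builder.validate()
    builder.get_ring().save('object.ring.gz')
    builder.save('object.builder')

If min_part_hours has not yet elapsed, rebalance() may reassign nothing, which is what the 'No partitions could be reassigned' branch below reports.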
+ """ + usage = Commands.rebalance.__doc__.strip() + parser = optparse.OptionParser(usage) + parser.add_option('-f', '--force', action='store_true', + help='Force a rebalanced ring to save even ' + 'if < 1% of parts changed') + parser.add_option('-s', '--seed', help="seed to use for rebalance") + parser.add_option('-d', '--debug', action='store_true', + help="print debug information") + parser.add_option('--format-version', + choices=FORMAT_CHOICES, default=None, + help="specify ring format version") + options, args = parser.parse_args(argv) + if options.format_version is None: + print("Defaulting to --format-version=1. This ensures the ring\n" + "written will be readable by older versions of Swift.\n" + "In a future release, the default will change to\n" + "--format-version=2\n") + options.format_version = DEFAULT_RING_FORMAT_VERSION + else: + # N.B. choices doesn't work with type=int + options.format_version = int(options.format_version) + + def get_seed(index): + if options.seed: + return options.seed + try: + return args[index] + except IndexError: + pass + + if options.debug: + logger = logging.getLogger("swift.ring.builder") + logger.disabled = False + logger.setLevel(logging.DEBUG) + handler = logging.StreamHandler(stdout) + formatter = logging.Formatter("%(levelname)s: %(message)s") + handler.setFormatter(formatter) + logger.addHandler(handler) + + if builder.next_part_power: + print('Partition power increase in progress.') + print('You need to finish the increase first before rebalancing.') + exit(EXIT_ERROR) + + devs_changed = builder.devs_changed + min_part_seconds_left = builder.min_part_seconds_left + try: + last_balance = builder.get_balance() + last_dispersion = builder.dispersion + parts, balance, removed_devs = builder.rebalance(seed=get_seed(3)) + dispersion = builder.dispersion + except exceptions.RingBuilderError as e: + print('-' * 79) + print("An error has occurred during ring validation. Common\n" + "causes of failure are rings that are empty or do not\n" + "have enough devices to accommodate the replica count.\n" + "Original exception message:\n %s" % + (e,)) + print('-' * 79) + exit(EXIT_ERROR) + if not (parts or options.force or removed_devs): + print('No partitions could be reassigned.') + if min_part_seconds_left > 0: + print('The time between rebalances must be at least ' + 'min_part_hours: %s hours (%s remaining)' % ( + builder.min_part_hours, + timedelta(seconds=builder.min_part_seconds_left))) + else: + print('There is no need to do so at this time') + exit(EXIT_WARNING) + # If we set device's weight to zero, currently balance will be set + # special value(MAX_BALANCE) until zero weighted device return all + # its partitions. So we cannot check balance has changed. + # Thus we need to check balance or last_balance is special value. + be_cowardly = True + if options.force: + # User said save it, so we save it. + be_cowardly = False + elif devs_changed: + # We must save if a device changed; this could be something like + # a changed IP address. + be_cowardly = False + else: + # If balance or dispersion changed (presumably improved), then + # we should save to get the improvement. 
+ balance_changed = ( + abs(last_balance - balance) >= 1 or + (last_balance == MAX_BALANCE and balance == MAX_BALANCE)) + dispersion_changed = last_dispersion is None or ( + abs(last_dispersion - dispersion) >= 1) + if balance_changed or dispersion_changed: + be_cowardly = False + + if be_cowardly: + print('Cowardly refusing to save rebalance as it did not change ' + 'at least 1%.') + exit(EXIT_WARNING) + try: + builder.validate() + except exceptions.RingValidationError as e: + print('-' * 79) + print("An error has occurred during ring validation. Common\n" + "causes of failure are rings that are empty or do not\n" + "have enough devices to accommodate the replica count.\n" + "Original exception message:\n %s" % + (e,)) + print('-' * 79) + exit(EXIT_ERROR) + print('Reassigned %d (%.02f%%) partitions. ' + 'Balance is now %.02f. ' + 'Dispersion is now %.02f' % ( + parts, 100.0 * parts / builder.parts, + balance, + builder.dispersion)) + status = EXIT_SUCCESS + if builder.dispersion > 0: + print('-' * 79) + print( + 'NOTE: Dispersion of %.06f indicates some parts are not\n' + ' optimally dispersed.\n\n' + ' You may want to adjust some device weights, increase\n' + ' the overload or review the dispersion report.' % + builder.dispersion) + status = EXIT_WARNING + print('-' * 79) + elif balance > 5 and balance / 100.0 > builder.overload: + print('-' * 79) + print('NOTE: Balance of %.02f indicates you should push this ' % + balance) + print(' ring, wait at least %d hours, and rebalance/repush.' + % builder.min_part_hours) + print('-' * 79) + status = EXIT_WARNING + ts = time() + builder.get_ring().save( + pathjoin(backup_dir, '%d.' % ts + basename(ring_file)), + format_version=options.format_version) + builder.save(pathjoin(backup_dir, '%d.' % ts + basename(builder_file))) + builder.get_ring().save( + ring_file, format_version=options.format_version) + builder.save(builder_file) + exit(status) + + @staticmethod + def dispersion(): + r""" +swift-ring-builder dispersion [options] + + Output report on dispersion. + + --recalculate option will rebuild cached dispersion info and save builder + --verbose option will display dispersion graph broken down by tier + + You can filter which tiers are evaluated to drill down using a regex + in the optional search_filter argument. i.e. + + swift-ring-builder dispersion "r\d+z\d+$" -v + + ... would only display rows for the zone tiers + + swift-ring-builder dispersion ".*\-[^/]*$" -v + + ... would only display rows for the server tiers + + The reports columns are: + + Tier : the name of the tier + parts : the total number of partitions with assignment in the tier + % : the percentage of parts in the tier with replicas over assigned + max : maximum replicas a part should have assigned at the tier + 0 - N : the number of parts with that many replicas assigned + + e.g. + Tier: parts % max 0 1 2 3 + r1z1 1022 79.45 1 2 210 784 28 + + r1z1 has 1022 total parts assigned, 79% of them have more than the + recommend max replica count of 1 assigned. Only 2 parts in the ring + are *not* assigned in this tier (0 replica count), 210 parts have + the recommend replica count of 1, 784 have 2 replicas, and 28 sadly + have all three replicas in this tier. + """ + status = EXIT_SUCCESS + if not builder._replica2part2dev: + print('Specified builder file \"%s\" is not rebalanced yet. ' + 'Please rebalance first.' 
% builder_file) + exit(EXIT_ERROR) + usage = Commands.dispersion.__doc__.strip() + parser = optparse.OptionParser(usage) + parser.add_option('--recalculate', action='store_true', + help='Rebuild cached dispersion info and save') + parser.add_option('-v', '--verbose', action='store_true', + help='Display dispersion report for tiers') + options, args = parser.parse_args(argv) + if args[3:]: + search_filter = args[3] + else: + search_filter = None + orig_version = builder.version + report = dispersion_report(builder, search_filter=search_filter, + verbose=options.verbose, + recalculate=options.recalculate) + if builder.version != orig_version: + # we've already done the work, better go ahead and save it! + builder.save(builder_file) + print('Dispersion is %.06f, Balance is %.06f, Overload is %0.2f%%' % ( + builder.dispersion, builder.get_balance(), builder.overload * 100)) + print('Required overload is %.6f%%' % ( + builder.get_required_overload() * 100)) + if report['worst_tier']: + status = EXIT_WARNING + print('Worst tier is %.06f (%s)' % (report['max_dispersion'], + report['worst_tier'])) + if report['graph']: + replica_range = list(range(int(math.ceil(builder.replicas + 1)))) + part_count_width = '%%%ds' % max(len(str(builder.parts)), 5) + replica_counts_tmpl = ' '.join(part_count_width for i in + replica_range) + tiers = (tier for tier, _junk in report['graph']) + tier_width = max(max(map(len, tiers)), 30) + header_line = ('%-' + str(tier_width) + + 's ' + part_count_width + + ' %6s %6s ' + replica_counts_tmpl) % tuple( + ['Tier', 'Parts', '%', 'Max'] + replica_range) + underline = '-' * len(header_line) + print(underline) + print(header_line) + print(underline) + for tier_name, dispersion in report['graph']: + replica_counts_repr = replica_counts_tmpl % tuple( + dispersion['replicas']) + template = ''.join([ + '%-', str(tier_width), 's ', + part_count_width, + ' %6.02f %6d %s', + ]) + args = ( + tier_name, + dispersion['placed_parts'], + dispersion['dispersion'], + dispersion['max_replicas'], + replica_counts_repr, + ) + print(template % args) + exit(status) + + @staticmethod + def validate(): + """ +swift-ring-builder validate + Just runs the validation routines on the ring. + """ + builder.validate() + exit(EXIT_SUCCESS) + + @staticmethod + def write_ring(): + """ +swift-ring-builder write_ring + Just rewrites the distributable ring file. This is done automatically after + a successful rebalance, so really this is only useful after one or more + 'set_info' calls when no rebalance is needed but you want to send out the + new device information. + """ + usage = Commands.write_ring.__doc__.strip() + parser = optparse.OptionParser(usage) + parser.add_option('--format-version', + choices=FORMAT_CHOICES, default=None, + help="specify ring format version") + options, args = parser.parse_args(argv) + if options.format_version is None: + print("Defaulting to --format-version=1. This ensures the ring\n" + "written will be readable by older versions of Swift.\n" + "In a future release, the default will change to\n" + "--format-version=2\n") + options.format_version = DEFAULT_RING_FORMAT_VERSION + else: + # N.B. 
choices doesn't work with type=int + options.format_version = int(options.format_version) + + if not builder.devs: + print('Unable to write empty ring.') + exit(EXIT_ERROR) + + ring_data = builder.get_ring() + if not ring_data._replica2part2dev_id: + if ring_data.devs: + print('WARNING: Writing a ring with no partition ' + 'assignments but with devices; did you forget to run ' + '"rebalance"?', file=sys.stderr) + ring_data.save( + pathjoin(backup_dir, '%d.' % time() + basename(ring_file)), + format_version=options.format_version) + ring_data.save(ring_file, format_version=options.format_version) + exit(EXIT_SUCCESS) + + @staticmethod + def write_builder(): + """ +swift-ring-builder write_builder [min_part_hours] + Recreate a builder from a ring file (lossy) if you lost your builder + backups. (Protip: don't lose your builder backups). + [min_part_hours] is one of those numbers lost to the builder, + you can change it with set_min_part_hours. + """ + if exists(builder_file): + print('Cowardly refusing to overwrite existing ' + 'Ring Builder file: %s' % builder_file) + exit(EXIT_ERROR) + if len(argv) > 3: + min_part_hours = int(argv[3]) + else: + print("WARNING: default min_part_hours may not match " + "the value in the lost builder.\n", file=sys.stderr) + min_part_hours = 24 + ring = Ring(ring_file) + for dev in ring.devs: + if dev is None: + continue + dev.update({ + 'parts': 0, + 'parts_wanted': 0, + }) + builder_dict = { + 'part_power': 32 - ring._part_shift, + 'replicas': float(ring.replica_count), + 'min_part_hours': min_part_hours, + 'parts': ring.partition_count, + 'devs': ring.devs, + 'devs_changed': False, + 'version': ring.version or 0, + '_replica2part2dev': ring._replica2part2dev_id, + '_last_part_moves_epoch': None, + '_last_part_moves': None, + '_last_part_gather_start': 0, + '_remove_devs': [], + } + builder = RingBuilder.from_dict(builder_dict) + for parts in builder._replica2part2dev: + for dev_id in parts: + builder.devs[dev_id]['parts'] += 1 + builder.save(builder_file) + + @staticmethod + def pretend_min_part_hours_passed(): + """ +swift-ring-builder pretend_min_part_hours_passed + Resets the clock on the last time a rebalance happened, thus + circumventing the min_part_hours check. + + ***************************** + USE THIS WITH EXTREME CAUTION + ***************************** + + If you run this command and deploy rebalanced rings before a replication + pass completes, you may introduce unavailability in your cluster. This + has an end-user impact. + """ + builder.pretend_min_part_hours_passed() + builder.save(builder_file) + exit(EXIT_SUCCESS) + + @staticmethod + def set_min_part_hours(): + """ +swift-ring-builder set_min_part_hours + Changes the to the given . This should be set to + however long a full replication/update cycle takes. We're working on a way + to determine this more easily than scanning logs. + """ + if len(argv) < 4: + print(Commands.set_min_part_hours.__doc__.strip()) + exit(EXIT_ERROR) + builder.change_min_part_hours(int(argv[3])) + print('The minimum number of hours before a partition can be ' + 'reassigned is now set to %s' % argv[3]) + builder.save(builder_file) + exit(EXIT_SUCCESS) + + @staticmethod + def set_replicas(): + """ +swift-ring-builder set_replicas + Changes the replica count to the given . may + be a floating-point value, in which case some partitions will have + floor() replicas and some will have ceiling() + in the correct proportions. + + A rebalance is needed to make the change take effect. 
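As a worked illustration (the builder file name is hypothetical):

    swift-ring-builder object.builder set_replicas 3.25
    # roughly 75% of partitions keep floor(3.25) = 3 replicas and the
    # remaining 25% get ceil(3.25) = 4, averaging 3 * 0.75 + 4 * 0.25 = 3.25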
+ """ + if len(argv) < 4: + print(Commands.set_replicas.__doc__.strip()) + exit(EXIT_ERROR) + + new_replicas = argv[3] + try: + new_replicas = float(new_replicas) + except ValueError: + print(Commands.set_replicas.__doc__.strip()) + print("\"%s\" is not a valid number." % new_replicas) + exit(EXIT_ERROR) + + if new_replicas < 1: + print("Replica count must be at least 1.") + exit(EXIT_ERROR) + + builder.set_replicas(new_replicas) + print('The replica count is now %.6f.' % builder.replicas) + print('The change will take effect after the next rebalance.') + builder.save(builder_file) + exit(EXIT_SUCCESS) + + @staticmethod + def set_overload(): + """ +swift-ring-builder set_overload [%] + Changes the overload factor to the given . + + A rebalance is needed to make the change take effect. + """ + if len(argv) < 4: + print(Commands.set_overload.__doc__.strip()) + exit(EXIT_ERROR) + + new_overload = argv[3] + if new_overload.endswith('%'): + percent = True + new_overload = new_overload.rstrip('%') + else: + percent = False + try: + new_overload = float(new_overload) + except ValueError: + print(Commands.set_overload.__doc__.strip()) + print("%r is not a valid number." % new_overload) + exit(EXIT_ERROR) + + if percent: + new_overload *= 0.01 + if new_overload < 0: + print("Overload must be non-negative.") + exit(EXIT_ERROR) + + if new_overload > 1 and not percent: + print("!?! Warning overload is greater than 100% !?!") + status = EXIT_WARNING + else: + status = EXIT_SUCCESS + + builder.set_overload(new_overload) + print('The overload factor is now %0.2f%% (%.6f)' % ( + builder.overload * 100, builder.overload)) + print('The change will take effect after the next rebalance.') + builder.save(builder_file) + exit(status) + + @staticmethod + def prepare_increase_partition_power(): + """ +swift-ring-builder prepare_increase_partition_power + Prepare the ring to increase the partition power by one. + + A write_ring command is needed to make the change take effect. + + Once the updated rings have been deployed to all servers you need to run + the swift-object-relinker tool to relink existing data. + + ***************************** + USE THIS WITH EXTREME CAUTION + ***************************** + + If you increase the partition power and deploy changed rings, you may + introduce unavailability in your cluster. This has an end-user impact. Make + sure you execute required operations to increase the partition power + accurately. + + """ + if len(argv) < 3: + print(Commands.prepare_increase_partition_power.__doc__.strip()) + exit(EXIT_ERROR) + + if "object" not in basename(builder_file): + print( + 'Partition power increase is only supported for object rings.') + exit(EXIT_ERROR) + + if not builder.prepare_increase_partition_power(): + print('Ring is already prepared for partition power increase.') + exit(EXIT_ERROR) + + builder.save(builder_file) + + print('The next partition power is now %d.' % builder.next_part_power) + print('The change will take effect after the next write_ring.') + print('Ensure your proxy-servers, object-replicators and ') + print('reconstructors are using the changed rings and relink ') + print('(using swift-object-relinker) your existing data') + print('before the partition power increase') + exit(EXIT_SUCCESS) + + @staticmethod + def increase_partition_power(): + """ +swift-ring-builder increase_partition_power + Increases the partition power by one. 
Needs to be run after + prepare_increase_partition_power has been run and all existing data has + been relinked using the swift-object-relinker tool. + + A write_ring command is needed to make the change take effect. + + Once the updated rings have been deployed to all servers you need to run + the swift-object-relinker tool to cleanup old data. + + ***************************** + USE THIS WITH EXTREME CAUTION + ***************************** + + If you increase the partition power and deploy changed rings, you may + introduce unavailability in your cluster. This has an end-user impact. Make + sure you execute required operations to increase the partition power + accurately. + + """ + if len(argv) < 3: + print(Commands.increase_partition_power.__doc__.strip()) + exit(EXIT_ERROR) + + if builder.increase_partition_power(): + print('The partition power is now %d.' % builder.part_power) + print('The change will take effect after the next write_ring.') + + builder._update_last_part_moves() + builder.save(builder_file) + + exit(EXIT_SUCCESS) + else: + print('Ring partition power cannot be increased. Either the ring') + print('was not prepared yet, or this operation has already run.') + exit(EXIT_ERROR) + + @staticmethod + def cancel_increase_partition_power(): + """ +swift-ring-builder cancel_increase_partition_power + Cancel the increase of the partition power. + + A write_ring command is needed to make the change take effect. + + Once the updated rings have been deployed to all servers you need to run + the swift-object-relinker tool to cleanup unneeded links. + + ***************************** + USE THIS WITH EXTREME CAUTION + ***************************** + + If you increase the partition power and deploy changed rings, you may + introduce unavailability in your cluster. This has an end-user impact. Make + sure you execute required operations to increase the partition power + accurately. + + """ + if len(argv) < 3: + print(Commands.cancel_increase_partition_power.__doc__.strip()) + exit(EXIT_ERROR) + + if not builder.cancel_increase_partition_power(): + print('Ring partition power increase cannot be canceled.') + exit(EXIT_ERROR) + + builder.save(builder_file) + + print('The next partition power is now %d.' % builder.next_part_power) + print('The change will take effect after the next write_ring.') + print('Ensure your object-servers are using the changed rings and') + print('cleanup (using swift-object-relinker) the hard links') + exit(EXIT_SUCCESS) + + @staticmethod + def finish_increase_partition_power(): + """ +swift-ring-builder finish_increase_partition_power + Finally removes the next_part_power flag. Has to be run after the + swift-object-relinker tool has been used to cleanup old existing data. + + A write_ring command is needed to make the change take effect. + + ***************************** + USE THIS WITH EXTREME CAUTION + ***************************** + + If you increase the partition power and deploy changed rings, you may + introduce unavailability in your cluster. This has an end-user impact. Make + sure you execute required operations to increase the partition power + accurately. 
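Taken together, the prepare/increase/finish commands describe a workflow that looks roughly like the following sequence (object.builder is a placeholder; after each write_ring the new ring must be deployed to all nodes before continuing):

    swift-ring-builder object.builder prepare_increase_partition_power
    swift-ring-builder object.builder write_ring
    swift-object-relinker relink        # on every object server
    swift-ring-builder object.builder increase_partition_power
    swift-ring-builder object.builder write_ring
    swift-object-relinker cleanup       # on every object server
    swift-ring-builder object.builder finish_increase_partition_power
    swift-ring-builder object.builder write_ring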
+ + """ + if len(argv) < 3: + print(Commands.finish_increase_partition_power.__doc__.strip()) + exit(EXIT_ERROR) + + if not builder.finish_increase_partition_power(): + print('Ring partition power increase cannot be finished.') + exit(EXIT_ERROR) + + print('The change will take effect after the next write_ring.') + builder.save(builder_file) + + exit(EXIT_SUCCESS) + + +def main(arguments=None): + global argv, backup_dir, builder, builder_file, ring_file + if arguments is not None: + argv = arguments + else: + argv = sys_argv + + if len(argv) < 2: + print("swift-ring-builder %(MAJOR_VERSION)s.%(MINOR_VERSION)s\n" % + globals()) + print(Commands.default.__doc__.strip()) + print() + cmds = [c for c in dir(Commands) + if getattr(Commands, c).__doc__ and not c.startswith('_') and + c != 'default'] + cmds.sort() + for cmd in cmds: + print(getattr(Commands, cmd).__doc__.strip()) + print() + print(parse_search_value.__doc__.strip()) + print() + for line in wrap(' '.join(cmds), 79, initial_indent='Quick list: ', + subsequent_indent=' '): + print(line) + print('Exit codes: 0 = operation successful\n' + ' 1 = operation completed with warnings\n' + ' 2 = error') + exit(EXIT_SUCCESS) + + builder_file, ring_file = parse_builder_ring_filename_args(argv) + if builder_file != argv[1]: + if len(argv) > 2 and argv[2] in ('write_builder', 'version'): + pass + else: + print('Note: using %s instead of %s as builder file' % ( + builder_file, argv[1])) + + try: + builder = RingBuilder.load(builder_file) + except exceptions.UnPicklingError as e: + msg = str(e) + try: + CompositeRingBuilder.load(builder_file) + msg += ' (it appears to be a composite ring builder file?)' + except Exception: # noqa + pass + print(msg) + exit(EXIT_ERROR) + except (exceptions.FileNotFoundError, exceptions.PermissionError) as e: + if len(argv) < 3 or argv[2] not in ('create', 'write_builder', + 'version'): + print(e) + exit(EXIT_ERROR) + except Exception as e: + print('Problem occurred while reading builder file: %s. %s' % + (builder_file, e)) + exit(EXIT_ERROR) + + backup_dir = pathjoin(dirname(builder_file), 'backups') + try: + mkdir(backup_dir) + except OSError as err: + if err.errno != EEXIST: + raise + + if len(argv) == 2: + command = "default" + else: + command = argv[2] + if argv[0].endswith('-safe'): + try: + with lock_parent_directory(abspath(builder_file), 15): + getattr(Commands, command, Commands.unknown)() + except exceptions.LockTimeout: + print("Ring/builder dir currently locked.") + exit(2) + else: + getattr(Commands, command, Commands.unknown)() + + +def error_handling_main(): + # We exit code 1 on WARNING statuses, 2 on ERROR. This means we need + # to handle any uncaught exceptions by printing the usual backtrace, + # but then exiting 2 (not 1 as is usual for a python + # exception). + + # We *don't* want to do this in main(), however, because we don't want to + # pollute the test environment or cause a bunch of test churn to mock out + # sys.excepthook + + def exit_with_status_two(tp, val, tb): + traceback.print_exception(tp, val, tb) + exit(2) + + sys.excepthook = exit_with_status_two + main() + + +if __name__ == '__main__': + error_handling_main() diff --git a/swift/cli/ringcomposer.py b/swift/cli/ringcomposer.py new file mode 100644 index 0000000000..99b7ce6ccf --- /dev/null +++ b/swift/cli/ringcomposer.py @@ -0,0 +1,182 @@ +# Copyright (c) 2017 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. 
+# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. +""" +``swift-ring-composer`` is an experimental tool for building a composite ring +file from other existing component ring builder files. Its CLI, name or +implementation may change or be removed altogether in future versions of Swift. + +Currently its interface is similar to that of the ``swift-ring-builder``. The +command structure takes the form of:: + + swift-ring-composer + +where ```` is a special builder which stores a json +blob of composite ring metadata. This metadata describes the component +``RingBuilder``'s used in the composite ring, their order and version. + +There are currently 2 sub-commands: ``show`` and ``compose``. The ``show`` +sub-command takes no additional arguments and displays the current contents of +of the composite builder file:: + + swift-ring-composer show + +The ``compose`` sub-command is the one that actually stitches the component +ring builders together to create both the composite ring file and composite +builder file. The command takes the form:: + + swift-ring-composer compose \\ + [ .. ] --output \\ + [--force] + +There may look like there is a lot going on there but it's actually quite +simple. The ``compose`` command takes in the list of builders to stitch +together and the filename for the composite ring file via the ``--output`` +option. The ``--force`` option overrides checks on the ring composition. + +To change ring devices, first add or remove devices from the component ring +builders and then use the ``compose`` sub-command to create a new composite +ring file. + +.. note:: + + ``swift-ring-builder`` cannot be used to inspect the generated composite + ring file because there is no conventional builder file corresponding to + the composite ring file name. You can either programmatically look inside + the composite ring file using the swift ring classes or create a temporary + builder file from the composite ring file using:: + + swift-ring-builder write_builder + + Do not use this builder file to manage ring devices. + +For further details use:: + + swift-ring-composer -h +""" +import argparse +import json +import os +import sys + +from swift.common.ring.composite_builder import CompositeRingBuilder + +EXIT_SUCCESS = 0 +EXIT_ERROR = 2 + +WARNING = """ +NOTE: This tool is for experimental use and may be + removed in future versions of Swift. +""" + +DESCRIPTION = """ +This is a tool for building a composite ring file from other existing ring +builder files. The component ring builders must all have the same partition +power. Each device must only be used in a single component builder. Each region +must only be used in a single component builder. 
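A minimal sketch of the flow implemented by the compose() function below, assuming two hypothetical component builder files:

    # sketch only: compose two component builders into a single ring file
    from swift.common.ring.composite_builder import CompositeRingBuilder

    cb = CompositeRingBuilder()
    ring_data = cb.compose(['region1.builder', 'region2.builder'])
    ring_data.save('composite.ring.gz')
    cb.save('composite.builder')

This corresponds to the compose sub-command shown above with --output composite.ring.gz.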
+""" + + +def _print_to_stderr(msg): + print(msg, file=sys.stderr) + + +def _print_err(msg, err): + _print_to_stderr('%s\nOriginal exception message:\n%s' % (msg, err)) + + +def show(composite_builder, args): + print(json.dumps(composite_builder.to_dict(), indent=4, sort_keys=True)) + return EXIT_SUCCESS + + +def compose(composite_builder, args): + composite_builder = composite_builder or CompositeRingBuilder() + try: + ring_data = composite_builder.compose( + args.builder_files, force=args.force, require_modified=True) + except Exception as err: + _print_err( + 'An error occurred while composing the ring.', err) + return EXIT_ERROR + try: + ring_data.save(args.output) + except Exception as err: + _print_err( + 'An error occurred while writing the composite ring file.', err) + return EXIT_ERROR + try: + composite_builder.save(args.composite_builder_file) + except Exception as err: + _print_err( + 'An error occurred while writing the composite builder file.', err) + return EXIT_ERROR + return EXIT_SUCCESS + + +def main(arguments=None): + if arguments is not None: + argv = arguments + else: + argv = sys.argv + + parser = argparse.ArgumentParser(description=DESCRIPTION) + parser.add_argument( + 'composite_builder_file', + metavar='composite_builder_file', type=str, + help='Name of composite builder file') + + subparsers = parser.add_subparsers( + help='subcommand help', title='subcommands') + + # show + show_parser = subparsers.add_parser( + 'show', help='show composite ring builder metadata') + show_parser.set_defaults(func=show) + + # compose + compose_parser = subparsers.add_parser( + 'compose', help='compose composite ring', + usage='%(prog)s [-h] ' + '[builder_file builder_file [builder_file ...] ' + '--output ring_file [--force]') + bf_help = ('Paths to component ring builder files to include in composite ' + 'ring') + compose_parser.add_argument('builder_files', metavar='builder_file', + nargs='*', type=str, help=bf_help) + compose_parser.add_argument('--output', metavar='output_file', type=str, + required=True, help='Name of output ring file') + compose_parser.add_argument( + '--force', action='store_true', + help='Force new composite ring file to be written') + compose_parser.set_defaults(func=compose) + + _print_to_stderr(WARNING) + args = parser.parse_args(argv[1:]) + composite_builder = None + if args.func != compose or os.path.exists(args.composite_builder_file): + try: + composite_builder = CompositeRingBuilder.load( + args.composite_builder_file) + except Exception as err: + _print_err( + 'An error occurred while loading the composite builder file.', + err) + exit(EXIT_ERROR) + + exit(args.func(composite_builder, args)) + + +if __name__ == '__main__': + main() diff --git a/swift/cli/shard-info.py b/swift/cli/shard-info.py new file mode 100644 index 0000000000..fdcfdf5d3e --- /dev/null +++ b/swift/cli/shard-info.py @@ -0,0 +1,196 @@ +# Copyright (c) 2017 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
+ +import os +from collections import defaultdict + +from swift.common import utils +from swift.common.db_replicator import roundrobin_datadirs +from swift.common.ring import ring +from swift.common.utils import Timestamp +from swift.container.backend import ContainerBroker, DATADIR + +TAB = ' ' + + +def broker_key(broker): + broker.get_info() + return broker.path + + +def container_type(broker): + return 'ROOT' if broker.is_root_container() else 'SHARD' + + +def collect_brokers(conf_path, names2nodes): + conf = utils.readconf(conf_path, 'container-replicator') + root = conf.get('devices', '/srv/node') + swift_dir = conf.get('swift_dir', '/etc/swift') + c_ring = ring.Ring(swift_dir, ring_name='container') + dirs = [] + brokers = defaultdict(dict) + for node in c_ring.devs: + if node is None: + continue + datadir = os.path.join(root, node['device'], DATADIR) + if os.path.isdir(datadir): + dirs.append((datadir, node['id'], lambda *args: True)) + for part, object_file, node_id in roundrobin_datadirs(dirs): + broker = ContainerBroker(object_file) + for node in c_ring.get_part_nodes(int(part)): + if node['id'] == node_id: + node_index = str(node['index']) + break + else: + node_index = 'handoff' + names2nodes[broker_key(broker)][(node_id, node_index)] = broker + return brokers + + +def print_broker_info(node, broker, indent_level=0): + indent = indent_level * TAB + info = broker.get_info() + raw_info = broker._get_info() + deleted_at = float(info['delete_timestamp']) + if deleted_at: + deleted_at = Timestamp(info['delete_timestamp']).isoformat + else: + deleted_at = ' - ' + print('%s(%s) %s, objs: %s, bytes: %s, actual_objs: %s, put: %s, ' + 'deleted: %s' % + (indent, node[1][0], broker.get_db_state(), + info['object_count'], info['bytes_used'], raw_info['object_count'], + Timestamp(info['put_timestamp']).isoformat, deleted_at)) + + +def print_db(node, broker, expect_type='ROOT', indent_level=0): + indent = indent_level * TAB + print('%s(%s) %s node id: %s, node index: %s' % + (indent, node[1][0], broker.db_file, node[0], node[1])) + actual_type = container_type(broker) + if actual_type != expect_type: + print('%s ERROR expected %s but found %s' % + (indent, expect_type, actual_type)) + + +def print_own_shard_range(node, sr, indent_level): + indent = indent_level * TAB + range = '%r - %r' % (sr.lower, sr.upper) + print('%s(%s) %23s, objs: %3s, bytes: %3s, timestamp: %s (%s), ' + 'modified: %s (%s), %7s: %s (%s), deleted: %s, epoch: %s' % + (indent, node[1][0], range, sr.object_count, sr.bytes_used, + sr.timestamp.isoformat, sr.timestamp.internal, + sr.meta_timestamp.isoformat, sr.meta_timestamp.internal, + sr.state_text, sr.state_timestamp.isoformat, + sr.state_timestamp.internal, sr.deleted, + sr.epoch.internal if sr.epoch else None)) + + +def print_own_shard_range_info(node, shard_ranges, indent_level=0): + shard_ranges.sort(key=lambda x: x.deleted) + for sr in shard_ranges: + print_own_shard_range(node, sr, indent_level) + + +def print_shard_range(node, sr, indent_level): + indent = indent_level * TAB + range = '%r - %r' % (sr.lower, sr.upper) + print('%s(%s) %23s, objs: %3s, bytes: %3s, timestamp: %s (%s), ' + 'modified: %s (%s), %7s: %s (%s), deleted: %s, epoch: %s %s' % + (indent, node[1][0], range, sr.object_count, sr.bytes_used, + sr.timestamp.isoformat, sr.timestamp.internal, + sr.meta_timestamp.isoformat, sr.meta_timestamp.internal, + sr.state_text, sr.state_timestamp.isoformat, + sr.state_timestamp.internal, sr.deleted, + sr.epoch.internal if sr.epoch else None, sr.name)) + + +def 
print_shard_range_info(node, shard_ranges, indent_level=0): + shard_ranges.sort(key=lambda x: x.deleted) + for sr in shard_ranges: + print_shard_range(node, sr, indent_level) + + +def print_sharding_info(node, broker, indent_level=0): + indent = indent_level * TAB + print('%s(%s) %s' % (indent, node[1][0], broker.get_sharding_sysmeta())) + + +def print_container(name, name2nodes2brokers, expect_type='ROOT', + indent_level=0, used_names=None): + used_names = used_names or set() + indent = indent_level * TAB + node2broker = name2nodes2brokers[name] + ordered_by_index = sorted(node2broker.keys(), key=lambda x: x[1]) + brokers = [(node, node2broker[node]) for node in ordered_by_index] + + print('%sName: %s' % (indent, name)) + if name in used_names: + print('%s (Details already listed)\n' % indent) + return + + used_names.add(name) + print(indent + 'DB files:') + for node, broker in brokers: + print_db(node, broker, expect_type, indent_level=indent_level + 1) + + print(indent + 'Info:') + for node, broker in brokers: + print_broker_info(node, broker, indent_level=indent_level + 1) + + print(indent + 'Sharding info:') + for node, broker in brokers: + print_sharding_info(node, broker, indent_level=indent_level + 1) + print(indent + 'Own shard range:') + for node, broker in brokers: + shard_ranges = broker.get_shard_ranges( + include_deleted=True, include_own=True, exclude_others=True) + print_own_shard_range_info(node, shard_ranges, + indent_level=indent_level + 1) + print(indent + 'Shard ranges:') + shard_names = set() + for node, broker in brokers: + shard_ranges = broker.get_shard_ranges(include_deleted=True) + for sr_name in shard_ranges: + shard_names.add(sr_name.name) + print_shard_range_info(node, shard_ranges, + indent_level=indent_level + 1) + print(indent + 'Shards:') + for sr_name in shard_names: + print_container(sr_name, name2nodes2brokers, expect_type='SHARD', + indent_level=indent_level + 1, used_names=used_names) + print('\n') + + +def run(conf_paths): + # container_name -> (node id, node index) -> broker + name2nodes2brokers = defaultdict(dict) + for conf_path in conf_paths: + collect_brokers(conf_path, name2nodes2brokers) + + print('First column on each line is (node index)\n') + for name, node2broker in name2nodes2brokers.items(): + expect_root = False + for node, broker in node2broker.items(): + expect_root = broker.is_root_container() or expect_root + if expect_root: + print_container(name, name2nodes2brokers) + + +if __name__ == '__main__': + conf_dir = '/etc/swift/container-server' + conf_paths = [os.path.join(conf_dir, p) for p in os.listdir(conf_dir) + if p.endswith(('conf', 'conf.d'))] + run(conf_paths) diff --git a/swift/common/__init__.py b/swift/common/__init__.py index 880a66aa87..56aa6012d4 100644 --- a/swift/common/__init__.py +++ b/swift/common/__init__.py @@ -1 +1 @@ -""" Code common to all of Swift. """ +"""Code common to all of Swift.""" diff --git a/swift/common/base_storage_server.py b/swift/common/base_storage_server.py new file mode 100644 index 0000000000..7ba30703d2 --- /dev/null +++ b/swift/common/base_storage_server.py @@ -0,0 +1,141 @@ +# Copyright (c) 2010-2014 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. 
+# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +import inspect +import time +import functools + +from swift import __version__ as swift_version +from swift.common.utils import public, config_true_value, \ + LOG_LINE_DEFAULT_FORMAT +from swift.common.http import is_server_error +from swift.common.swob import Response, HTTPException + + +def labeled_timing_stats(metric, **dec_kwargs): + """ + Returns a decorator that emits labeled metrics timing events or errors + for public methods in swift's wsgi server controllers, based on response + code. + + The controller methods are not allowed to override the following labels: + 'method', 'status'. + """ + def decorating_func(func): + + @functools.wraps(func) + def _timing_stats(ctrl, req, *args, **kwargs): + labels = {} + start_time = time.time() + req_method = req.method + try: + resp = func( + ctrl, req, *args, timing_stats_labels=labels, **kwargs) + except HTTPException as e: + resp = e + labels['method'] = req_method + labels['status'] = resp.status_int + + ctrl.statsd.timing_since(metric, start_time, labels=labels, + **dec_kwargs) + return resp + + return _timing_stats + return decorating_func + + +def timing_stats(**dec_kwargs): + """ + Returns a decorator that logs timing events or errors for public methods in + swift's wsgi server controllers, based on response code. + """ + def decorating_func(func): + method = func.__name__ + + @functools.wraps(func) + def _timing_stats(ctrl, *args, **kwargs): + start_time = time.time() + try: + resp = func(ctrl, *args, **kwargs) + except HTTPException as e: + resp = e + # .timing is for successful responses *or* error codes that are + # not Swift's fault. For example, 500 is definitely the server's + # fault, but 412 is an error code (4xx are all errors) that is + # due to a header the client sent. + # + # .errors.timing is for failures that *are* Swift's fault. + # Examples include 507 for an unmounted drive or 500 for an + # unhandled exception. + if not is_server_error(resp.status_int): + ctrl.logger.timing_since(method + '.timing', + start_time, **dec_kwargs) + else: + ctrl.logger.timing_since(method + '.errors.timing', + start_time, **dec_kwargs) + return resp + + return _timing_stats + return decorating_func + + +class BaseStorageServer(object): + """ + Implements common OPTIONS method for object, account, container servers. 
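As a rough illustration of how the timing_stats decorator above is meant to be used, a hypothetical subclass might look like the sketch below. MyController, the 'my-server' type and the GET handler are invented for the example; real servers additionally accept a conf dict and set up self.logger (and, for labeled_timing_stats, self.statsd).

    # sketch only: a publicly accessible, timed controller method
    from swift.common.base_storage_server import BaseStorageServer, timing_stats
    from swift.common.swob import Response
    from swift.common.utils import public


    class MyController(BaseStorageServer):
        server_type = 'my-server'  # shadows the abstract server_type property

        @public
        @timing_stats()
        def GET(self, req):
            # a success here emits GET.timing; a 5xx would emit GET.errors.timing
            return Response(status=200, request=req)

Because GET is marked @public, it would also appear in the Allow header produced by the OPTIONS handler below.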
+ """ + + def __init__(self, conf, **kwargs): + self._allowed_methods = None + self.replication_server = config_true_value( + conf.get('replication_server', 'true')) + self.log_format = conf.get('log_format', LOG_LINE_DEFAULT_FORMAT) + self.anonymization_method = conf.get('log_anonymization_method', 'md5') + self.anonymization_salt = conf.get('log_anonymization_salt', '') + + @property + def server_type(self): + raise NotImplementedError( + 'Storage nodes have not implemented the Server type.') + + @property + def allowed_methods(self): + if self._allowed_methods is None: + self._allowed_methods = [] + all_methods = inspect.getmembers(self, predicate=callable) + for name, m in all_methods: + if not getattr(m, 'publicly_accessible', False): + continue + if getattr(m, 'replication', False) and \ + not self.replication_server: + continue + self._allowed_methods.append(name) + self._allowed_methods.sort() + return self._allowed_methods + + @public + @timing_stats() + def OPTIONS(self, req): + """ + Base handler for OPTIONS requests + + :param req: swob.Request object + :returns: swob.Response object + """ + # Prepare the default response + headers = {'Allow': ', '.join(self.allowed_methods), + 'Server': '%s/%s' % (self.server_type, swift_version)} + resp = Response(status=200, request=req, headers=headers) + + return resp diff --git a/swift/common/bench.py b/swift/common/bench.py deleted file mode 100644 index 7eef51a57d..0000000000 --- a/swift/common/bench.py +++ /dev/null @@ -1,486 +0,0 @@ -# Copyright (c) 2010-2012 OpenStack, LLC. -# -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. -# You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or -# implied. -# See the License for the specific language governing permissions and -# limitations under the License. - -import re -import sys -import uuid -import time -import random -import signal -import socket -import logging -from contextlib import contextmanager -from optparse import Values - -import eventlet -import eventlet.pools -from eventlet.green.httplib import CannotSendRequest - -from swift.common.utils import config_true_value, LogAdapter -import swiftclient as client -from swift.common import direct_client -from swift.common.http import HTTP_CONFLICT - -try: - import simplejson as json -except ImportError: - import json - - -def _func_on_containers(logger, conf, concurrency_key, func): - """Run a function on each container with concurrency.""" - - bench = Bench(logger, conf, []) - pool = eventlet.GreenPool(int(getattr(conf, concurrency_key))) - for container in conf.containers: - pool.spawn_n(func, bench.url, bench.token, container) - pool.waitall() - - -def delete_containers(logger, conf): - """Utility function to delete benchmark containers.""" - - def _deleter(url, token, container): - try: - client.delete_container(url, token, container) - except client.ClientException, e: - if e.http_status != HTTP_CONFLICT: - logger.warn("Unable to delete container '%s'. " - "Got http status '%d'." 
- % (container, e.http_status)) - - _func_on_containers(logger, conf, 'del_concurrency', _deleter) - - -def create_containers(logger, conf): - """Utility function to create benchmark containers.""" - - _func_on_containers(logger, conf, 'put_concurrency', client.put_container) - - -class SourceFile(object): - """ - Iterable, file-like object to lazily emit a bunch of zeros in - reasonable-size chunks. - - swift.common.direct_client wants iterables, but swiftclient wants - file-like objects where hasattr(thing, 'read') is true. Therefore, - this class can do both. - """ - - def __init__(self, size, chunk_size=1024 * 64): - self.pos = 0 - self.size = size - self.chunk_size = chunk_size - - def __iter__(self): - return self - - def __len__(self): - return self.size - - def next(self): - if self.pos >= self.size: - raise StopIteration - chunk_size = min(self.size - self.pos, self.chunk_size) - yield '0' * chunk_size - self.pos += chunk_size - - def read(self, desired_size): - chunk_size = min(self.size - self.pos, desired_size) - self.pos += chunk_size - return '0' * chunk_size - - -class ConnectionPool(eventlet.pools.Pool): - - def __init__(self, url, size): - self.url = url - eventlet.pools.Pool.__init__(self, size, size) - - def create(self): - return client.http_connection(self.url) - - -class BenchServer(object): - """ - A BenchServer binds to an IP/port and listens for bench jobs. A bench - job consists of the normal conf "dict" encoded in JSON, terminated with an - EOF. The log level is at least INFO, but DEBUG may also be specified in - the conf dict. - - The server will wait forever for jobs, running them one at a time. - """ - def __init__(self, logger, bind_ip, bind_port): - self.logger = logger - self.bind_ip = bind_ip - self.bind_port = int(bind_port) - - def run(self): - s = socket.socket(socket.AF_INET, socket.SOCK_STREAM) - self.logger.info('Binding to %s:%s', self.bind_ip, self.bind_port) - s.bind((self.bind_ip, self.bind_port)) - s.listen(20) - while True: - client, address = s.accept() - self.logger.debug('Accepting connection from %s:%s', *address) - client_file = client.makefile('rb+', 1) - json_data = client_file.read() - conf = Values(json.loads(json_data)) - - self.logger.info( - 'Starting run for %s:%s [put/get/del_concurrency: %s/%s/%s, ' - 'num_objects: %s, num_gets: %s]', address[0], address[1], - conf.put_concurrency, conf.get_concurrency, - conf.del_concurrency, conf.num_objects, conf.num_gets) - - logger = logging.getLogger('bench-server') - level = logging.DEBUG if conf.log_level.lower() == 'debug' \ - else logging.INFO - logger.setLevel(level) - loghandler = logging.StreamHandler(client_file) - logformat = logging.Formatter( - '%(server)s %(asctime)s %(levelname)s %(message)s') - loghandler.setFormatter(logformat) - logger.addHandler(loghandler) - logger = LogAdapter(logger, 'swift-bench-server') - - controller = BenchController(logger, conf) - try: - controller.run() - except socket.error: - logger.warning('Socket error', exc_info=1) - - logger.logger.removeHandler(loghandler) - client_file.close() - client.close() - - self.logger.info('...bench run completed; waiting for next run.') - - -class Bench(object): - - def __init__(self, logger, conf, names): - self.logger = logger - self.aborted = False - self.user = conf.user - self.key = conf.key - self.auth_url = conf.auth - self.use_proxy = config_true_value(conf.use_proxy) - self.auth_version = conf.auth_version - self.logger.info("Auth version: %s" % self.auth_version) - if self.use_proxy: - url, token = 
client.get_auth(self.auth_url, self.user, self.key, - auth_version=self.auth_version) - self.token = token - self.account = url.split('/')[-1] - if conf.url == '': - self.url = url - else: - self.url = conf.url - else: - self.token = 'SlapChop!' - self.account = conf.account - self.url = conf.url - self.ip, self.port = self.url.split('/')[2].split(':') - - self.object_size = int(conf.object_size) - self.object_sources = conf.object_sources - self.lower_object_size = int(conf.lower_object_size) - self.upper_object_size = int(conf.upper_object_size) - self.files = [] - if self.object_sources: - self.object_sources = self.object_sources.split() - self.files = [file(f, 'rb').read() for f in self.object_sources] - - self.put_concurrency = int(conf.put_concurrency) - self.get_concurrency = int(conf.get_concurrency) - self.del_concurrency = int(conf.del_concurrency) - self.total_objects = int(conf.num_objects) - self.total_gets = int(conf.num_gets) - self.timeout = int(conf.timeout) - self.devices = conf.devices.split() - self.names = names - self.conn_pool = ConnectionPool(self.url, - max(self.put_concurrency, - self.get_concurrency, - self.del_concurrency)) - - def _log_status(self, title): - total = time.time() - self.beginbeat - self.logger.info(_('%(complete)s %(title)s [%(fail)s failures], ' - '%(rate).01f/s'), - {'title': title, 'complete': self.complete, - 'fail': self.failures, - 'rate': (float(self.complete) / total)}) - - @contextmanager - def connection(self): - try: - hc = self.conn_pool.get() - try: - yield hc - except CannotSendRequest: - self.logger.info(_("CannotSendRequest. Skipping...")) - try: - hc.close() - except Exception: - pass - self.failures += 1 - hc = self.conn_pool.create() - finally: - self.conn_pool.put(hc) - - def run(self): - pool = eventlet.GreenPool(self.concurrency) - self.beginbeat = self.heartbeat = time.time() - self.heartbeat -= 13 # just to get the first report quicker - self.failures = 0 - self.complete = 0 - for i in xrange(self.total): - if self.aborted: - break - pool.spawn_n(self._run, i) - pool.waitall() - self._log_status(self.msg + ' **FINAL**') - - def _run(self, thread): - return - - -class DistributedBenchController(object): - """ - This class manages a distributed swift-bench run. For this Controller - class to make sense, the conf.bench_clients list must contain at least one - entry. - - The idea is to split the configured load between one or more - swift-bench-client processes, each of which use eventlet for concurrency. - We deliberately take a simple, naive approach with these limitations: - 1) Concurrency, num_objects, and num_gets are spread evenly between the - swift-bench-client processes. With a low concurrency to - swift-bench-client count ratio, rounding may result in a greater - than desired aggregate concurrency. - 2) Each swift-bench-client process runs independently so some may - finish up before others, i.e. the target aggregate concurrency is - not necessarily present the whole time. This may bias aggregate - reported rates lower than a more efficient architecture. - 3) Because of #2, some swift-bench-client processes may be running GETs - while others are still runinng their PUTs. Because of this - potential skew, distributed runs will not isolate one operation at a - time like a single swift-bench run will. - 3) Reported aggregate rates are simply the sum of each - swift-bench-client process reported FINAL number. That's probably - inaccurate somehow. - """ - - def __init__(self, logger, conf): - self.logger = logger - # ... 
INFO 1000 PUTS **FINAL** [0 failures], 34.9/s - self.final_re = re.compile( - 'INFO (\d+) (.*) \*\*FINAL\*\* \[(\d+) failures\], (\d+\.\d+)/s') - self.clients = conf.bench_clients - del conf.bench_clients - for k in ['put_concurrency', 'get_concurrency', 'del_concurrency', - 'num_objects', 'num_gets']: - setattr(conf, k, max(1, int(getattr(conf, k)) / len(self.clients))) - self.conf = conf - - def run(self): - eventlet.patcher.monkey_patch(socket=True) - pool = eventlet.GreenPool(size=len(self.clients)) - pile = eventlet.GreenPile(pool) - for client in self.clients: - pile.spawn(self.do_run, client) - results = { - 'PUTS': dict(count=0, failures=0, rate=0.0), - 'GETS': dict(count=0, failures=0, rate=0.0), - 'DEL': dict(count=0, failures=0, rate=0.0), - } - for result in pile: - for k, v in result.iteritems(): - target = results[k] - target['count'] += int(v['count']) - target['failures'] += int(v['failures']) - target['rate'] += float(v['rate']) - for k in ['PUTS', 'GETS', 'DEL']: - v = results[k] - self.logger.info('%d %s **FINAL** [%d failures], %.1f/s' % ( - v['count'], k, v['failures'], v['rate'])) - - def do_run(self, client): - s = socket.socket(socket.AF_INET, socket.SOCK_STREAM) - ip, port = client.split(':') - s.connect((ip, int(port))) - s.sendall(json.dumps(self.conf.__dict__)) - s.shutdown(socket.SHUT_WR) - s_file = s.makefile('rb', 1) - result = {} - for line in s_file: - match = self.final_re.search(line) - if match: - g = match.groups() - result[g[1]] = { - 'count': g[0], - 'failures': g[2], - 'rate': g[3], - } - else: - sys.stderr.write('%s %s' % (client, line)) - return result - - -class BenchController(object): - - def __init__(self, logger, conf): - self.logger = logger - self.conf = conf - self.names = [] - self.delete = config_true_value(conf.delete) - self.gets = int(conf.num_gets) - self.aborted = False - - def sigint1(self, signum, frame): - if self.delete: - print >>sys.stderr, ( - 'SIGINT received; finishing up and running DELETE.\n' - 'Send one more SIGINT to exit *immediately*.') - self.aborted = True - if self.running and not isinstance(self.running, BenchDELETE): - self.running.aborted = True - signal.signal(signal.SIGINT, self.sigint2) - else: - self.sigint2(signum, frame) - - def sigint2(self, signum, frame): - sys.exit('Final SIGINT received.') - - def run(self): - signal.signal(signal.SIGINT, self.sigint1) - puts = BenchPUT(self.logger, self.conf, self.names) - self.running = puts - puts.run() - if self.gets and not self.aborted: - gets = BenchGET(self.logger, self.conf, self.names) - self.running = gets - gets.run() - if self.delete: - dels = BenchDELETE(self.logger, self.conf, self.names) - self.running = dels - dels.run() - - -class BenchDELETE(Bench): - - def __init__(self, logger, conf, names): - Bench.__init__(self, logger, conf, names) - self.concurrency = self.del_concurrency - self.total = len(names) - self.msg = 'DEL' - - def _run(self, thread): - if time.time() - self.heartbeat >= 15: - self.heartbeat = time.time() - self._log_status('DEL') - device, partition, name, container_name = self.names.pop() - with self.connection() as conn: - try: - if self.use_proxy: - client.delete_object(self.url, self.token, - container_name, name, http_conn=conn) - else: - node = {'ip': self.ip, 'port': self.port, 'device': device} - direct_client.direct_delete_object(node, partition, - self.account, - container_name, name) - except client.ClientException, e: - self.logger.debug(str(e)) - self.failures += 1 - self.complete += 1 - - -class BenchGET(Bench): - - def 
__init__(self, logger, conf, names): - Bench.__init__(self, logger, conf, names) - self.concurrency = self.get_concurrency - self.total = self.total_gets - self.msg = 'GETS' - - def _run(self, thread): - if time.time() - self.heartbeat >= 15: - self.heartbeat = time.time() - self._log_status('GETS') - device, partition, name, container_name = random.choice(self.names) - with self.connection() as conn: - try: - if self.use_proxy: - client.get_object(self.url, self.token, - container_name, name, http_conn=conn) - else: - node = {'ip': self.ip, 'port': self.port, 'device': device} - direct_client.direct_get_object(node, partition, - self.account, - container_name, name) - except client.ClientException, e: - self.logger.debug(str(e)) - self.failures += 1 - self.complete += 1 - - -class BenchPUT(Bench): - - def __init__(self, logger, conf, names): - Bench.__init__(self, logger, conf, names) - self.concurrency = self.put_concurrency - self.total = self.total_objects - self.msg = 'PUTS' - self.containers = conf.containers - - def _run(self, thread): - if time.time() - self.heartbeat >= 15: - self.heartbeat = time.time() - self._log_status('PUTS') - name = uuid.uuid4().hex - if self.object_sources: - source = random.choice(self.files) - elif self.upper_object_size > self.lower_object_size: - source = SourceFile(random.randint(self.lower_object_size, - self.upper_object_size)) - else: - source = SourceFile(self.object_size) - device = random.choice(self.devices) - partition = str(random.randint(1, 3000)) - container_name = random.choice(self.containers) - with self.connection() as conn: - try: - if self.use_proxy: - client.put_object(self.url, self.token, - container_name, name, source, - content_length=len(source), - http_conn=conn) - else: - node = {'ip': self.ip, 'port': self.port, 'device': device} - direct_client.direct_put_object(node, partition, - self.account, - container_name, name, - source, - content_length=len(source)) - except client.ClientException, e: - self.logger.debug(str(e)) - self.failures += 1 - else: - self.names.append((device, partition, name, container_name)) - self.complete += 1 diff --git a/swift/common/bufferedhttp.py b/swift/common/bufferedhttp.py index 00e58da756..62c07e1623 100644 --- a/swift/common/bufferedhttp.py +++ b/swift/common/bufferedhttp.py @@ -1,4 +1,4 @@ -# Copyright (c) 2010-2012 OpenStack, LLC. +# Copyright (c) 2010-2012 OpenStack Foundation # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. @@ -26,12 +26,23 @@ make all calls through httplib. """ -from urllib import quote +from swift.common import constraints +import http.client import logging import time +import socket -from eventlet.green.httplib import CONTINUE, HTTPConnection, HTTPMessage, \ - HTTPResponse, HTTPSConnection, _UNKNOWN +from eventlet.green.http.client import CONTINUE, HTTPConnection, \ + HTTPResponse, HTTPSConnection, _UNKNOWN, ImproperConnectionState +from urllib.parse import quote, parse_qsl, urlencode + +from eventlet.green.http import client as green_http_client + +# Apparently http.server uses this to decide when/whether to send a 431. +# Give it some slack, so the app is more likely to get the chance to reject +# with a 400 instead. 
+http.client._MAXHEADERS = constraints.MAX_HEADER_COUNT * 1.6 +green_http_client._MAXHEADERS = constraints.MAX_HEADER_COUNT * 1.6 class BufferedHTTPResponse(HTTPResponse): @@ -39,13 +50,24 @@ class BufferedHTTPResponse(HTTPResponse): def __init__(self, sock, debuglevel=0, strict=0, method=None): # pragma: no cover + # sock should be an eventlet.greenio.GreenSocket self.sock = sock - self.fp = sock.makefile('rb') + if sock is None: + # ...but it could be None if we close the connection as we're + # getting it wrapped up in a Response + self._real_socket = None + # No socket means no file-like -- set it to None like in + # HTTPResponse.close() + self.fp = None + else: + # sock.fd is a socket.socket, which should have a _real_close + self._real_socket = sock.fd + self.fp = sock.makefile('rb') self.debuglevel = debuglevel self.strict = strict self._method = method - self.msg = None + self._headers = self.msg = None # from the Status-Line of the response self.version = _UNKNOWN # HTTP-Version @@ -56,11 +78,45 @@ def __init__(self, sock, debuglevel=0, strict=0, self.chunk_left = _UNKNOWN # bytes left to read in current chunk self.length = _UNKNOWN # number of bytes left in response self.will_close = _UNKNOWN # conn will close at end of response + self._readline_buffer = b'' + + @property + def headers(self): + return self._headers + + @headers.setter + def headers(self, hdrs): + try: + header_payload = hdrs.get_payload() + except AttributeError: + pass + else: + if isinstance(header_payload, list) and len(header_payload) == 1: + header_payload = header_payload[0].get_payload() + if header_payload: + # This shouldn't be here. We must've bumped up against + # https://bugs.python.org/issue37093 + for line in header_payload.rstrip('\r\n').split('\n'): + if ':' not in line or line[:1] in ' \t': + # Well, we're no more broken than we were before... + # Should we support line folding? + # How can/should we handle a bad header line? + break + header, value = line.split(':', 1) + value = value.strip(' \t\n\r') + hdrs.add_header(header, value) + # Clear the payload now that all headers are present. + # Otherwise, we may double-up the headers parsed here + # if/when repeatedly setting the headers property. + hdrs.set_payload(None) + self._headers = hdrs def expect_response(self): if self.fp: self.fp.close() self.fp = None + if not self.sock: + raise ImproperConnectionState('Socket already closed') self.fp = self.sock.makefile('rb', 0) version, status, reason = self._read_status() if status != CONTINUE: @@ -70,12 +126,49 @@ def expect_response(self): self.status = status self.reason = reason.strip() self.version = 11 - self.msg = HTTPMessage(self.fp, 0) - self.msg.fp = None + self.headers = self.msg = http.client.parse_headers(self.fp) + + def read(self, amt=None): + if not self._readline_buffer: + return HTTPResponse.read(self, amt) + + if amt is None: + # Unbounded read: send anything we have buffered plus whatever + # is left. 
+ buffered = self._readline_buffer + self._readline_buffer = b'' + return buffered + HTTPResponse.read(self, amt) + elif amt <= len(self._readline_buffer): + # Bounded read that we can satisfy entirely from our buffer + res = self._readline_buffer[:amt] + self._readline_buffer = self._readline_buffer[amt:] + return res + else: + # Bounded read that wants more bytes than we have + smaller_amt = amt - len(self._readline_buffer) + buf = self._readline_buffer + self._readline_buffer = b'' + return buf + HTTPResponse.read(self, smaller_amt) + + def nuke_from_orbit(self): + """ + Terminate the socket with extreme prejudice. + + Closes the underlying socket regardless of whether or not anyone else + has references to it. Use this when you are certain that nobody else + you care about has a reference to this socket. + """ + if self._real_socket: + # Hopefully this is equivalent to py2's _real_socket.close()? + # TODO: verify that this does everything ^^^^ does for py2 + self._real_socket._real_close() + self._real_socket = None + self.close() def close(self): HTTPResponse.close(self) self.sock = None + self._real_socket = None class BufferedHTTPConnection(HTTPConnection): @@ -84,24 +177,41 @@ class BufferedHTTPConnection(HTTPConnection): def connect(self): self._connected_time = time.time() - return HTTPConnection.connect(self) + ret = HTTPConnection.connect(self) + self.sock.setsockopt(socket.IPPROTO_TCP, socket.TCP_NODELAY, 1) + return ret def putrequest(self, method, url, skip_host=0, skip_accept_encoding=0): + '''Send a request to the server. + + :param method: specifies an HTTP request method, e.g. 'GET'. + :param url: specifies the object being requested, e.g. '/index.html'. + :param skip_host: if True does not add automatically a 'Host:' header + :param skip_accept_encoding: if True does not add automatically an + 'Accept-Encoding:' header + ''' self._method = method self._path = url return HTTPConnection.putrequest(self, method, url, skip_host, skip_accept_encoding) + def putheader(self, header, value): + if not isinstance(header, bytes): + header = header.encode('latin-1') + HTTPConnection.putheader(self, header, value) + def getexpect(self): - response = BufferedHTTPResponse(self.sock, strict=self.strict, - method=self._method) + kwargs = {'method': self._method} + if hasattr(self, 'strict'): + kwargs['strict'] = self.strict + response = BufferedHTTPResponse(self.sock, **kwargs) response.expect_response() return response def getresponse(self): response = HTTPConnection.getresponse(self) - logging.debug(_("HTTP PERF: %(time).5f seconds to %(method)s " - "%(host)s:%(port)s %(path)s)"), + logging.debug("HTTP PERF: %(time).5f seconds to %(method)s " + "%(host)s:%(port)s %(path)s)", {'time': time.time() - self._connected_time, 'method': self._method, 'host': self.host, 'port': self.port, 'path': self._path}) @@ -126,12 +236,15 @@ def http_connect(ipaddr, port, device, partition, method, path, :param ssl: set True if SSL should be used (default: False) :returns: HTTPConnection object """ - if isinstance(path, unicode): - try: - path = path.encode("utf-8") - except UnicodeError: - pass # what should I do? 
- path = quote('/' + device + '/' + str(partition) + path) + if isinstance(path, str): + path = path.encode("utf-8") + if isinstance(device, str): + device = device.encode("utf-8") + if isinstance(partition, str): + partition = partition.encode('utf-8') + elif isinstance(partition, int): + partition = str(partition).encode('ascii') + path = quote(b'/' + device + b'/' + partition + path) return http_connect_raw( ipaddr, port, method, path, headers, query_string, ssl) @@ -159,11 +272,16 @@ def http_connect_raw(ipaddr, port, method, path, headers=None, else: conn = BufferedHTTPConnection('%s:%s' % (ipaddr, port)) if query_string: + # Round trip to ensure proper quoting + query_string = urlencode( + parse_qsl(query_string, keep_blank_values=True, + encoding='latin1'), + encoding='latin1') path += '?' + query_string conn.path = path conn.putrequest(method, path, skip_host=(headers and 'Host' in headers)) if headers: - for header, value in headers.iteritems(): + for header, value in headers.items(): conn.putheader(header, str(value)) conn.endheaders() return conn diff --git a/swift/common/constraints.py b/swift/common/constraints.py index 07bf44e494..204a0d029e 100644 --- a/swift/common/constraints.py +++ b/swift/common/constraints.py @@ -1,4 +1,4 @@ -# Copyright (c) 2010-2012 OpenStack, LLC. +# Copyright (c) 2010-2012 OpenStack Foundation # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. @@ -13,89 +13,158 @@ # See the License for the specific language governing permissions and # limitations under the License. +import functools import os +from os.path import isdir # tighter scoped import for mocking + +from configparser import ConfigParser, NoSectionError, NoOptionError import urllib -from ConfigParser import ConfigParser, NoSectionError, NoOptionError, \ - RawConfigParser +from swift.common import utils, exceptions from swift.common.swob import HTTPBadRequest, HTTPLengthRequired, \ - HTTPRequestEntityTooLarge + HTTPRequestEntityTooLarge, HTTPPreconditionFailed, HTTPNotImplemented, \ + HTTPException, wsgi_to_str, wsgi_to_bytes -constraints_conf = ConfigParser() -constraints_conf.read('/etc/swift/swift.conf') +MAX_FILE_SIZE = 5368709122 +MAX_META_NAME_LENGTH = 128 +MAX_META_VALUE_LENGTH = 256 +MAX_META_COUNT = 90 +MAX_META_OVERALL_SIZE = 4096 +MAX_HEADER_SIZE = 8192 +MAX_REQUEST_LINE = 8192 +MAX_OBJECT_NAME_LENGTH = 1024 +CONTAINER_LISTING_LIMIT = 10000 +ACCOUNT_LISTING_LIMIT = 10000 +MAX_ACCOUNT_NAME_LENGTH = 256 +MAX_CONTAINER_NAME_LENGTH = 256 +VALID_API_VERSIONS = ["v1", "v1.0"] +EXTRA_HEADER_COUNT = 0 +AUTO_CREATE_ACCOUNT_PREFIX = '.' 
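These module-level values are only compiled-in defaults: reload_constraints(), defined just below, re-reads the [swift-constraints] section of swift.conf (utils.SWIFT_CONF_FILE, typically /etc/swift/swift.conf) and rebinds them, which is what lets operators tune limits without patching code. A minimal sketch of the effect, assuming an operator has set max_object_name_length = 2048 in swift.conf; that value and the conf contents are illustrative assumptions, not part of this patch:

    from swift.common import constraints

    # Assume /etc/swift/swift.conf contains:
    #   [swift-constraints]
    #   max_object_name_length = 2048
    constraints.reload_constraints()

    # Only options actually present in swift.conf land in OVERRIDE_CONSTRAINTS...
    constraints.OVERRIDE_CONSTRAINTS.get('max_object_name_length')  # -> 2048
    # ...while EFFECTIVE_CONSTRAINTS always carries a value for every known
    # constraint, and the matching module global is rebound as well.
    constraints.EFFECTIVE_CONSTRAINTS['max_object_name_length']     # -> 2048
    constraints.MAX_OBJECT_NAME_LENGTH                              # -> 2048

Without the override in swift.conf, the .get() above returns None and the effective value stays at the 1024 default.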
+# If adding an entry to DEFAULT_CONSTRAINTS, note that +# these constraints are automatically published by the +# proxy server in responses to /info requests, with values +# updated by reload_constraints() +DEFAULT_CONSTRAINTS = { + 'max_file_size': MAX_FILE_SIZE, + 'max_meta_name_length': MAX_META_NAME_LENGTH, + 'max_meta_value_length': MAX_META_VALUE_LENGTH, + 'max_meta_count': MAX_META_COUNT, + 'max_meta_overall_size': MAX_META_OVERALL_SIZE, + 'max_header_size': MAX_HEADER_SIZE, + 'max_request_line': MAX_REQUEST_LINE, + 'max_object_name_length': MAX_OBJECT_NAME_LENGTH, + 'container_listing_limit': CONTAINER_LISTING_LIMIT, + 'account_listing_limit': ACCOUNT_LISTING_LIMIT, + 'max_account_name_length': MAX_ACCOUNT_NAME_LENGTH, + 'max_container_name_length': MAX_CONTAINER_NAME_LENGTH, + 'valid_api_versions': VALID_API_VERSIONS, + 'extra_header_count': EXTRA_HEADER_COUNT, + 'auto_create_account_prefix': AUTO_CREATE_ACCOUNT_PREFIX, +} -def constraints_conf_int(name, default): - try: - return int(constraints_conf.get('swift-constraints', name)) - except (NoSectionError, NoOptionError): - return default - - -#: Max file size allowed for objects -MAX_FILE_SIZE = constraints_conf_int('max_file_size', - 5368709122) # 5 * 1024 * 1024 * 1024 + 2 -#: Max length of the name of a key for metadata -MAX_META_NAME_LENGTH = constraints_conf_int('max_meta_name_length', 128) -#: Max length of the value of a key for metadata -MAX_META_VALUE_LENGTH = constraints_conf_int('max_meta_value_length', 256) -#: Max number of metadata items -MAX_META_COUNT = constraints_conf_int('max_meta_count', 90) -#: Max overall size of metadata -MAX_META_OVERALL_SIZE = constraints_conf_int('max_meta_overall_size', 4096) -#: Max object name length -MAX_OBJECT_NAME_LENGTH = constraints_conf_int('max_object_name_length', 1024) -#: Max object list length of a get request for a container -CONTAINER_LISTING_LIMIT = constraints_conf_int('container_listing_limit', - 10000) -#: Max container list length of a get request for an account -ACCOUNT_LISTING_LIMIT = constraints_conf_int('account_listing_limit', 10000) -#: Max account name length -MAX_ACCOUNT_NAME_LENGTH = constraints_conf_int('max_account_name_length', 256) -#: Max container name length -MAX_CONTAINER_NAME_LENGTH = constraints_conf_int('max_container_name_length', - 256) - - -#: Query string format= values to their corresponding content-type values -FORMAT2CONTENT_TYPE = {'plain': 'text/plain', 'json': 'application/json', - 'xml': 'application/xml'} +SWIFT_CONSTRAINTS_LOADED = False +OVERRIDE_CONSTRAINTS = {} # any constraints overridden by SWIFT_CONF_FILE +EFFECTIVE_CONSTRAINTS = {} # populated by reload_constraints + + +def reload_constraints(): + """ + Parse SWIFT_CONF_FILE and reset module level global constraint attrs, + populating OVERRIDE_CONSTRAINTS AND EFFECTIVE_CONSTRAINTS along the way. + """ + global SWIFT_CONSTRAINTS_LOADED, OVERRIDE_CONSTRAINTS + SWIFT_CONSTRAINTS_LOADED = False + OVERRIDE_CONSTRAINTS = {} + constraints_conf = ConfigParser() + if constraints_conf.read(utils.SWIFT_CONF_FILE): + SWIFT_CONSTRAINTS_LOADED = True + for name, default in DEFAULT_CONSTRAINTS.items(): + try: + value = constraints_conf.get('swift-constraints', name) + except NoOptionError: + pass + except NoSectionError: + # We are never going to find the section for another option + break + else: + if isinstance(default, int): + value = int(value) # Go ahead and let it error + elif isinstance(default, str): + pass # No translation needed, I guess + else: + # Hope we want a list! 
+ value = utils.list_from_csv(value) + OVERRIDE_CONSTRAINTS[name] = value + for name, default in DEFAULT_CONSTRAINTS.items(): + value = OVERRIDE_CONSTRAINTS.get(name, default) + EFFECTIVE_CONSTRAINTS[name] = value + # "globals" in this context is module level globals, always. + globals()[name.upper()] = value + + +reload_constraints() + + +# By default the maximum number of allowed headers depends on the number of max +# allowed metadata settings plus a default value of 36 for swift internally +# generated headers and regular http headers. If for some reason this is not +# enough (custom middleware for example) it can be increased with the +# extra_header_count constraint. +MAX_HEADER_COUNT = MAX_META_COUNT + 36 + max(EXTRA_HEADER_COUNT, 0) def check_metadata(req, target_type): """ - Check metadata sent in the request headers. + Check metadata sent in the request headers. This should only check + that the metadata in the request given is valid. Checks against + account/container overall metadata should be forwarded on to its + respective server to be checked. :param req: request object :param target_type: str: one of: object, container, or account: indicates which type the target storage for the metadata is - :raises HTTPBadRequest: bad metadata + :returns: HTTPBadRequest with bad metadata otherwise None """ - prefix = 'x-%s-meta-' % target_type.lower() + target_type = target_type.lower() + prefix = 'x-%s-meta-' % target_type meta_count = 0 meta_size = 0 - for key, value in req.headers.iteritems(): + for key, value in req.headers.items(): + if (isinstance(value, str) + and len(value) > MAX_HEADER_SIZE): + + return HTTPBadRequest(body=b'Header value too long: %s' % + wsgi_to_bytes(key[:MAX_META_NAME_LENGTH]), + request=req, content_type='text/plain') if not key.lower().startswith(prefix): continue key = key[len(prefix):] if not key: return HTTPBadRequest(body='Metadata name cannot be empty', request=req, content_type='text/plain') + bad_key = not check_utf8(wsgi_to_str(key)) + bad_value = value and not check_utf8(wsgi_to_str(value)) + if target_type in ('account', 'container') and (bad_key or bad_value): + return HTTPBadRequest(body='Metadata must be valid UTF-8', + request=req, content_type='text/plain') meta_count += 1 meta_size += len(key) + len(value) if len(key) > MAX_META_NAME_LENGTH: return HTTPBadRequest( - body='Metadata name too long; max %d' % MAX_META_NAME_LENGTH, + body=wsgi_to_bytes('Metadata name too long: %s%s' % ( + prefix, key)), request=req, content_type='text/plain') - elif len(value) > MAX_META_VALUE_LENGTH: + if len(value) > MAX_META_VALUE_LENGTH: return HTTPBadRequest( - body='Metadata value too long; max %d' % MAX_META_VALUE_LENGTH, + body=wsgi_to_bytes('Metadata value longer than %d: %s%s' % ( + MAX_META_VALUE_LENGTH, prefix, key)), request=req, content_type='text/plain') - elif meta_count > MAX_META_COUNT: + if meta_count > MAX_META_COUNT: return HTTPBadRequest( body='Too many metadata items; max %d' % MAX_META_COUNT, request=req, content_type='text/plain') - elif meta_size > MAX_META_OVERALL_SIZE: + if meta_size > MAX_META_OVERALL_SIZE: return HTTPBadRequest( body='Total metadata too large; max %d' % MAX_META_OVERALL_SIZE, @@ -109,61 +178,102 @@ def check_object_creation(req, object_name): :param req: HTTP request object :param object_name: name of object to be created - :raises HTTPRequestEntityTooLarge: the object is too large - :raises HTTPLengthRequered: missing content-length header and not - a chunked request - :raises HTTPBadRequest: missing or bad 
content-type header, or - bad metadata + :returns: HTTPRequestEntityTooLarge -- the object is too large + :returns: HTTPLengthRequired -- missing content-length header and not + a chunked request + :returns: HTTPBadRequest -- missing or bad content-type header, or + bad metadata + :returns: HTTPNotImplemented -- unsupported transfer-encoding header value """ - if req.content_length and req.content_length > MAX_FILE_SIZE: + try: + ml = req.message_length() + except ValueError as e: + return HTTPBadRequest(request=req, content_type='text/plain', + body=str(e)) + except AttributeError as e: + return HTTPNotImplemented(request=req, content_type='text/plain', + body=str(e)) + if ml is not None and ml > MAX_FILE_SIZE: return HTTPRequestEntityTooLarge(body='Your request is too large.', request=req, content_type='text/plain') if req.content_length is None and \ req.headers.get('transfer-encoding') != 'chunked': - return HTTPLengthRequired(request=req) - if 'X-Copy-From' in req.headers and req.content_length: - return HTTPBadRequest(body='Copy requests require a zero byte body', - request=req, content_type='text/plain') + return HTTPLengthRequired(body='Missing Content-Length header.', + request=req, + content_type='text/plain') + if len(object_name) > MAX_OBJECT_NAME_LENGTH: return HTTPBadRequest(body='Object name length of %d longer than %d' % (len(object_name), MAX_OBJECT_NAME_LENGTH), request=req, content_type='text/plain') + if 'Content-Type' not in req.headers: return HTTPBadRequest(request=req, content_type='text/plain', - body='No content type') - if not check_utf8(req.headers['Content-Type']): + body=b'No content type') + + try: + req = check_delete_headers(req) + except HTTPException as e: + return HTTPBadRequest(request=req, body=e.body, + content_type='text/plain') + + if not check_utf8(wsgi_to_str(req.headers['Content-Type'])): return HTTPBadRequest(request=req, body='Invalid Content-Type', content_type='text/plain') - if 'x-object-manifest' in req.headers: - value = req.headers['x-object-manifest'] - container = prefix = None - try: - container, prefix = value.split('/', 1) - except ValueError: - pass - if not container or not prefix or '?' in value or '&' in value or \ - prefix[0] == '/': - return HTTPBadRequest( - request=req, - body='X-Object-Manifest must in the format container/prefix') return check_metadata(req, 'object') +def check_dir(root, drive): + """ + Verify that the path to the device is a directory and is a lesser + constraint that is enforced when a full mount_check isn't possible + with, for instance, a VM using loopback or partitions. + + :param root: base path where the dir is + :param drive: drive name to be checked + :returns: full path to the device + :raises ValueError: if drive fails to validate + """ + return check_drive(root, drive, False) + + def check_mount(root, drive): """ Verify that the path to the device is a mount point and mounted. This allows us to fast fail on drives that have been unmounted because of - issues, and also prevents us for accidently filling up the root partition. + issues, and also prevents us for accidentally filling up the root + partition. 
:param root: base path where the devices are mounted :param drive: drive name to be checked - :returns: True if it is a valid mounted device, False otherwise + :returns: full path to the device + :raises ValueError: if drive fails to validate """ - if not (urllib.quote_plus(drive) == drive): - return False + return check_drive(root, drive, True) + + +def check_drive(root, drive, mount_check): + """ + Validate the path given by root and drive is a valid existing directory. + + :param root: base path where the devices are mounted + :param drive: drive name to be checked + :param mount_check: additionally require path is mounted + + :returns: full path to the device + :raises ValueError: if drive fails to validate + """ + if not (urllib.parse.quote_plus(drive) == drive): + raise ValueError('%s is not a valid drive name' % drive) path = os.path.join(root, drive) - return os.path.exists(path) and os.path.ismount(path) + if mount_check: + if not utils.ismount(path): + raise ValueError('%s is not mounted' % path) + else: + if not isdir(path): + raise ValueError('%s is not a directory' % path) + return path def check_float(string): @@ -180,22 +290,149 @@ def check_float(string): return False -def check_utf8(string): +def valid_timestamp(request): + """ + Helper function to extract a timestamp from requests that require one. + + :param request: the swob request object + + :returns: a valid Timestamp instance + :raises HTTPBadRequest: on missing or invalid X-Timestamp + """ + try: + return request.timestamp + except exceptions.InvalidTimestamp as e: + raise HTTPBadRequest(body=str(e), request=request, + content_type='text/plain') + + +def check_delete_headers(request): + """ + Check that 'x-delete-after' and 'x-delete-at' headers have valid values. + Values should be positive integers and correspond to a time greater than + the request timestamp. + + If the 'x-delete-after' header is found then its value is used to compute + an 'x-delete-at' value which takes precedence over any existing + 'x-delete-at' header. + + :param request: the swob request object + :raises: HTTPBadRequest in case of invalid values + :returns: the swob request object + """ + now = float(valid_timestamp(request)) + if 'x-delete-after' in request.headers: + try: + x_delete_after = int(request.headers['x-delete-after']) + except ValueError: + raise HTTPBadRequest(request=request, + content_type='text/plain', + body='Non-integer X-Delete-After') + actual_del_time = utils.normalize_delete_at_timestamp( + now + x_delete_after) + if int(actual_del_time) <= now: + raise HTTPBadRequest(request=request, + content_type='text/plain', + body='X-Delete-After in past') + request.headers['x-delete-at'] = actual_del_time + del request.headers['x-delete-after'] + + if 'x-delete-at' in request.headers: + try: + x_delete_at = int(utils.normalize_delete_at_timestamp( + int(request.headers['x-delete-at']))) + except ValueError: + raise HTTPBadRequest(request=request, content_type='text/plain', + body='Non-integer X-Delete-At') + + if x_delete_at <= now and not utils.config_true_value( + request.headers.get('x-backend-replication', 'f')): + raise HTTPBadRequest(request=request, content_type='text/plain', + body='X-Delete-At in past') + return request + + +def check_utf8(string, internal=False): """ - Validate if a string is valid UTF-8 str or unicode + Validate if a string is valid UTF-8 str or unicode and that it + does not contain any reserved characters. 
:param string: string to be validated - :returns: True if the string is valid utf-8 str or unicode, False otherwise + :param internal: boolean, allows reserved characters if True + :returns: True if the string is valid utf-8 str or unicode and + contains no null characters, False otherwise """ if not string: return False try: - if isinstance(string, unicode): - string.encode('utf-8') + if isinstance(string, str): + encoded = string.encode('utf-8') + decoded = string else: - string.decode('UTF-8') - return True + encoded = string + decoded = string.decode('UTF-8') + if decoded.encode('UTF-8') != encoded: + return False + # A UTF-8 string with surrogates in it is invalid. + # + # Note: this check is only useful on Python 2. On Python 3, a + # bytestring with a UTF-8-encoded surrogate codepoint is (correctly) + # treated as invalid, so the decode() call above will fail. + # + # Note 2: this check requires us to use a wide build of Python 2. On + # narrow builds of Python 2, potato = u"\U0001F954" will have length + # 2, potato[0] == u"\ud83e" (surrogate), and potato[1] == u"\udda0" + # (also a surrogate), so even if it is correctly UTF-8 encoded as + # b'\xf0\x9f\xa6\xa0', it will not pass this check. Fortunately, + # most Linux distributions build Python 2 wide, and Python 3.3+ + # removed the wide/narrow distinction entirely. + if any(0xD800 <= ord(codepoint) <= 0xDFFF + for codepoint in decoded): + return False + if b'\x00' != utils.RESERVED_BYTE and b'\x00' in encoded: + return False + return True if internal else utils.RESERVED_BYTE not in encoded # If string is unicode, decode() will raise UnicodeEncodeError # So, we should catch both UnicodeDecodeError & UnicodeEncodeError except UnicodeError: return False + + +def check_name_format(req, name, target_type): + """ + Validate that the header contains valid account or container name. + + :param req: HTTP request object + :param name: header value to validate + :param target_type: which header is being validated (Account or Container) + :returns: A properly encoded account name or container name + :raise HTTPPreconditionFailed: if account header + is not well formatted. + """ + if not name: + raise HTTPPreconditionFailed( + request=req, + body='%s name cannot be empty' % target_type) + if '/' in name: + raise HTTPPreconditionFailed( + request=req, + body='%s name cannot contain slashes' % target_type) + return name + + +check_account_format = functools.partial(check_name_format, + target_type='Account') +check_container_format = functools.partial(check_name_format, + target_type='Container') + + +def valid_api_version(version): + """ + Checks if the requested version is valid. + + Currently Swift only supports "v1" and "v1.0". + """ + global VALID_API_VERSIONS + if not isinstance(VALID_API_VERSIONS, list): + VALID_API_VERSIONS = [str(VALID_API_VERSIONS)] + return version in VALID_API_VERSIONS diff --git a/swift/common/container_sync_realms.py b/swift/common/container_sync_realms.py new file mode 100644 index 0000000000..a9832ba437 --- /dev/null +++ b/swift/common/container_sync_realms.py @@ -0,0 +1,167 @@ +# Copyright (c) 2013 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. 
+# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +import errno +import hashlib +import hmac +import os +import time + +import configparser + +from swift.common.utils import get_valid_utf8_str + + +class ContainerSyncRealms(object): + """ + Loads and parses the container-sync-realms.conf, occasionally + checking the file's mtime to see if it needs to be reloaded. + """ + + def __init__(self, conf_path, logger): + self.conf_path = conf_path + self.logger = logger + self.next_mtime_check = 0 + self.mtime_check_interval = 300 + self.conf_path_mtime = 0 + self.data = {} + self.reload() + + def reload(self): + """Forces a reload of the conf file.""" + self.next_mtime_check = 0 + self.conf_path_mtime = 0 + self._reload() + + def _reload(self): + now = time.time() + if now >= self.next_mtime_check: + self.next_mtime_check = now + self.mtime_check_interval + try: + mtime = os.path.getmtime(self.conf_path) + except OSError as err: + if err.errno == errno.ENOENT: + log_func = self.logger.debug + else: + log_func = self.logger.error + log_func('Could not load %(conf)r: %(error)s', { + 'conf': self.conf_path, 'error': err}) + else: + if mtime != self.conf_path_mtime: + self.conf_path_mtime = mtime + try: + conf = configparser.ConfigParser() + conf.read(self.conf_path) + except configparser.ParsingError as err: + self.logger.error( + 'Could not load %(conf)r: %(error)s', + {'conf': self.conf_path, 'error': err}) + else: + try: + self.mtime_check_interval = conf.getfloat( + 'DEFAULT', 'mtime_check_interval') + self.next_mtime_check = \ + now + self.mtime_check_interval + except configparser.NoOptionError: + self.mtime_check_interval = 300 + self.next_mtime_check = \ + now + self.mtime_check_interval + except (configparser.ParsingError, ValueError) as err: + self.logger.error( + 'Error in %(conf)r with ' + 'mtime_check_interval: %(error)s', + {'conf': self.conf_path, 'error': err}) + realms = {} + for section in conf.sections(): + realm = {} + clusters = {} + for option, value in conf.items(section): + if option in ('key', 'key2'): + realm[option] = value + elif option.startswith('cluster_'): + clusters[option[8:].upper()] = value + realm['clusters'] = clusters + realms[section.upper()] = realm + self.data = realms + + def realms(self): + """Returns a list of realms.""" + self._reload() + return list(self.data.keys()) + + def key(self, realm): + """Returns the key for the realm.""" + self._reload() + result = self.data.get(realm.upper()) + if result: + result = result.get('key') + return result + + def key2(self, realm): + """Returns the key2 for the realm.""" + self._reload() + result = self.data.get(realm.upper()) + if result: + result = result.get('key2') + return result + + def clusters(self, realm): + """Returns a list of clusters for the realm.""" + self._reload() + result = self.data.get(realm.upper()) + if result: + result = result.get('clusters') + if result: + result = list(result.keys()) + return result or [] + + def endpoint(self, realm, cluster): + """Returns the endpoint for the cluster in the realm.""" + self._reload() + result = None + realm_data = self.data.get(realm.upper()) + if realm_data: + cluster_data = 
realm_data.get('clusters') + if cluster_data: + result = cluster_data.get(cluster.upper()) + return result + + def get_sig(self, request_method, path, x_timestamp, nonce, realm_key, + user_key): + """ + Returns the hexdigest string of the HMAC-SHA1 (RFC 2104) for + the information given. + + :param request_method: HTTP method of the request. + :param path: The path to the resource (url-encoded). + :param x_timestamp: (str) The X-Timestamp header value for the request. + :param nonce: A unique value for the request. + :param realm_key: Shared secret at the cluster operator level. + :param user_key: Shared secret at the user's container level. + :returns: hexdigest str of the HMAC-SHA1 for the request. + """ + nonce = get_valid_utf8_str(nonce) + realm_key = get_valid_utf8_str(realm_key) + user_key = get_valid_utf8_str(user_key) + # XXX We don't know what is the best here yet; wait for container + # sync to be tested. + if isinstance(path, str): + path = path.encode('utf-8') + return hmac.new( + realm_key, + b'%s\n%s\n%s\n%s\n%s' % ( + request_method.encode('ascii'), path, + x_timestamp.encode('ascii'), nonce, user_key), + hashlib.sha1).hexdigest() diff --git a/swift/common/daemon.py b/swift/common/daemon.py index 009619cc78..d6c431b6d1 100644 --- a/swift/common/daemon.py +++ b/swift/common/daemon.py @@ -1,4 +1,4 @@ -# Copyright (c) 2010-2012 OpenStack, LLC. +# Copyright (c) 2010-2012 OpenStack Foundation # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. @@ -13,18 +13,39 @@ # See the License for the specific language governing permissions and # limitations under the License. +import errno import os import sys +import time import signal from re import sub +import eventlet import eventlet.debug from swift.common import utils class Daemon(object): - """Daemon base class""" + """ + Daemon base class + + A daemon has a run method that accepts a ``once`` kwarg and will dispatch + to :meth:`run_once` or :meth:`run_forever`. + + A subclass of Daemon must implement :meth:`run_once` and + :meth:`run_forever`. + + A subclass of Daemon may override :meth:`get_worker_args` to dispatch + arguments to individual child process workers and :meth:`is_healthy` to + perform context specific periodic wellness checks which can reset worker + arguments. + + Implementations of Daemon do not know *how* to daemonize, or execute + multiple daemonized workers, they simply provide the behavior of the daemon + and context specific knowledge about how workers should be started. + """ + WORKERS_HEALTHCHECK_INTERVAL = 5.0 def __init__(self, conf): self.conf = conf @@ -39,42 +60,240 @@ def run_forever(self, *args, **kwargs): raise NotImplementedError('run_forever not implemented') def run(self, once=False, **kwargs): - """Run the daemon""" + if once: + self.run_once(**kwargs) + else: + self.run_forever(**kwargs) + + def post_multiprocess_run(self): + """ + Override this to do something after running using multiple worker + processes. This method is called in the parent process. + + This is probably only useful for run-once mode since there is no + "after running" in run-forever mode. + """ + pass + + def get_worker_args(self, once=False, **kwargs): + """ + For each worker yield a (possibly empty) dict of kwargs to pass along + to the daemon's :meth:`run` method after fork. The length of elements + returned from this method will determine the number of processes + created. 
+ + If the returned iterable is empty, the Strategy will fallback to + run-inline strategy. + + :param once: False if the worker(s) will be daemonized, True if the + worker(s) will be run once + :param kwargs: plumbed through via command line argparser + + :returns: an iterable of dicts, each element represents the kwargs to + be passed to a single worker's :meth:`run` method after fork. + """ + return [] + + def is_healthy(self): + """ + This method is called very frequently on the instance of the daemon + held by the parent process. If it returns False, all child workers are + terminated, and new workers will be created. + + :returns: a boolean, True only if all workers should continue to run + """ + return True + + +class DaemonStrategy(object): + """ + This is the execution strategy for using subclasses of Daemon. The default + behavior is to invoke the daemon's :meth:`Daemon.run` method from within + the parent process. When the :meth:`Daemon.run` method returns the parent + process will exit. + + However, if the Daemon returns a non-empty iterable from + :meth:`Daemon.get_worker_args`, the daemon's :meth:`Daemon.run` method will + be invoked in child processes, with the arguments provided from the parent + process's instance of the daemon. If a child process exits it will be + restarted with the same options, unless it was executed in once mode. + + :param daemon: an instance of a :class:`Daemon` (has a `run` method) + :param logger: a logger instance + """ + + def __init__(self, daemon, logger): + self.daemon = daemon + self.logger = logger + self.running = False + # only used by multi-worker strategy + self.options_by_pid = {} + self.unspawned_worker_options = [] + + def setup(self, **kwargs): utils.validate_configuration() - utils.drop_privileges(self.conf.get('user', 'swift')) + utils.drop_privileges(self.daemon.conf.get('user', 'swift')) + utils.clean_up_daemon_hygiene() utils.capture_stdio(self.logger, **kwargs) def kill_children(*args): + self.running = False + self.logger.notice('SIGTERM received (%s)', os.getpid()) signal.signal(signal.SIGTERM, signal.SIG_IGN) os.killpg(0, signal.SIGTERM) - sys.exit() + os._exit(0) signal.signal(signal.SIGTERM, kill_children) - if once: - self.run_once(**kwargs) + self.running = True + utils.systemd_notify(self.logger) + + def _run_inline(self, once=False, **kwargs): + """Run the daemon""" + self.daemon.run(once=once, **kwargs) + + def run(self, once=False, **kwargs): + """Daemonize and execute our strategy""" + self.setup(**kwargs) + try: + self._run(once=once, **kwargs) + except KeyboardInterrupt: + self.logger.notice('User quit') + finally: + self.cleanup(stopping=True) + self.running = False + + def _fork(self, once, **kwargs): + pid = os.fork() + if pid == 0: + signal.signal(signal.SIGHUP, signal.SIG_DFL) + signal.signal(signal.SIGTERM, signal.SIG_DFL) + # only MAINPID should be sending notifications + os.environ.pop('NOTIFY_SOCKET', None) + + self.daemon.run(once, **kwargs) + + self.logger.debug('Forked worker %s finished', os.getpid()) + # do not return from this stack, nor execute any finally blocks + os._exit(0) else: - self.run_forever(**kwargs) + self.register_worker_start(pid, kwargs) + return pid + + def iter_unspawned_workers(self): + while True: + try: + per_worker_options = self.unspawned_worker_options.pop() + except IndexError: + return + yield per_worker_options + + def spawned_pids(self): + return list(self.options_by_pid.keys()) + + def register_worker_start(self, pid, per_worker_options): + self.logger.debug('Spawned 
worker %s with %r', pid, per_worker_options) + self.options_by_pid[pid] = per_worker_options + + def register_worker_exit(self, pid): + self.unspawned_worker_options.append(self.options_by_pid.pop(pid)) + + def ask_daemon_to_prepare_workers(self, once, **kwargs): + self.unspawned_worker_options = list( + self.daemon.get_worker_args(once=once, **kwargs)) + + def abort_workers_if_daemon_would_like(self): + if not self.daemon.is_healthy(): + self.logger.debug( + 'Daemon needs to change options, aborting workers') + self.cleanup() + return True + return False + + def check_on_all_running_workers(self): + for p in self.spawned_pids(): + try: + pid, status = os.waitpid(p, os.WNOHANG) + except OSError as err: + if err.errno not in (errno.EINTR, errno.ECHILD): + raise + self.logger.notice('Worker %s died', p) + else: + if pid == 0: + # child still running + continue + self.logger.debug('Worker %s exited', p) + self.register_worker_exit(p) + + def _run(self, once, **kwargs): + self.ask_daemon_to_prepare_workers(once, **kwargs) + if not self.unspawned_worker_options: + return self._run_inline(once, **kwargs) + for per_worker_options in self.iter_unspawned_workers(): + if self._fork(once, **per_worker_options) == 0: + return 0 + while self.running: + if self.abort_workers_if_daemon_would_like(): + self.ask_daemon_to_prepare_workers(once, **kwargs) + self.check_on_all_running_workers() + if not once: + for per_worker_options in self.iter_unspawned_workers(): + if self._fork(once, **per_worker_options) == 0: + return 0 + else: + if not self.spawned_pids(): + self.logger.notice('Finished %s', os.getpid()) + break + time.sleep(self.daemon.WORKERS_HEALTHCHECK_INTERVAL) + self.daemon.post_multiprocess_run() + return 0 + + def cleanup(self, stopping=False): + """ + Cleanup worker processes + + :param stopping: if set, tell systemd we're stopping + """ + + if stopping: + utils.systemd_notify(self.logger, "STOPPING=1") + for p in self.spawned_pids(): + try: + os.kill(p, signal.SIGTERM) + except OSError as err: + if err.errno not in (errno.ESRCH, errno.EINTR, errno.ECHILD): + raise + self.register_worker_exit(p) + self.logger.debug('Cleaned up worker %s', p) def run_daemon(klass, conf_file, section_name='', once=False, **kwargs): """ - Loads settings from conf, then instantiates daemon "klass" and runs the - daemon with the specified once kwarg. The section_name will be derived - from the daemon "klass" if not provided (e.g. ObjectReplicator => + Loads settings from conf, then instantiates daemon ``klass`` and runs the + daemon with the specified ``once`` kwarg. The section_name will be derived + from the daemon ``klass`` if not provided (e.g. ObjectReplicator => object-replicator). 
- :param klass: Class to instantiate, subclass of common.daemon.Daemon + :param klass: Class to instantiate, subclass of :class:`Daemon` :param conf_file: Path to configuration file :param section_name: Section name from conf file to load config from - :param once: Passed to daemon run method + :param once: Passed to daemon :meth:`Daemon.run` method """ # very often the config section_name is based on the class name # the None singleton will be passed through to readconf as is - if section_name is '': + if section_name == '': section_name = sub(r'([a-z])([A-Z])', r'\1-\2', klass.__name__).lower() - conf = utils.readconf(conf_file, section_name, - log_name=kwargs.get('log_name')) + try: + conf = utils.readconf(conf_file, section_name, + log_name=kwargs.get('log_name')) + except (ValueError, IOError) as e: + # The message will be printed to stderr + # and results in an exit code of 1. + sys.exit(e) + + # patch eventlet/logging early + utils.monkey_patch() + eventlet.hubs.use_hub(utils.get_hub()) # once on command line (i.e. daemonize=false) will over-ride config once = once or not utils.config_true_value(conf.get('daemonize', 'true')) @@ -87,16 +306,30 @@ def run_daemon(klass, conf_file, section_name='', once=False, **kwargs): log_to_console=kwargs.pop('verbose', False), log_route=section_name) + # optional nice/ionice priority scheduling + utils.modify_priority(conf, logger) + # disable fallocate if desired if utils.config_true_value(conf.get('disable_fallocate', 'no')): utils.disable_fallocate() + # set utils.FALLOCATE_RESERVE if desired + utils.FALLOCATE_RESERVE, utils.FALLOCATE_IS_PERCENT = \ + utils.config_fallocate_value(conf.get('fallocate_reserve', '1%')) # By default, disable eventlet printing stacktraces eventlet_debug = utils.config_true_value(conf.get('eventlet_debug', 'no')) eventlet.debug.hub_exceptions(eventlet_debug) + # Ensure TZ environment variable exists to avoid stat('/etc/localtime') on + # some platforms. This locks in reported times to UTC. + os.environ['TZ'] = 'UTC+0' + time.tzset() + + logger.notice('Starting %s', os.getpid()) try: - klass(conf).run(once=once, **kwargs) + d = klass(conf) + DaemonStrategy(d, logger).run(once=once, **kwargs) except KeyboardInterrupt: logger.info('User quit') - logger.info('Exited') + logger.notice('Exited %s', os.getpid()) + return d diff --git a/swift/common/db.py b/swift/common/db.py index 06f7c6295f..447228f130 100644 --- a/swift/common/db.py +++ b/swift/common/db.py @@ -1,4 +1,4 @@ -# Copyright (c) 2010-2012 OpenStack, LLC. +# Copyright (c) 2010-2012 OpenStack Foundation # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. 
@@ -15,39 +15,77 @@ """ Database code for Swift """ -from __future__ import with_statement -from contextlib import contextmanager -import hashlib +from contextlib import contextmanager, closing +import base64 +import json import logging -import operator import os from uuid import uuid4 -import sys import time -import cPickle as pickle import errno +import pickle # nosec: B403 from tempfile import mkstemp from eventlet import sleep, Timeout import sqlite3 -from swift.common.utils import json, normalize_timestamp, renamer, \ - mkdirs, lock_parent_directory, fallocate +from swift.common.constraints import MAX_META_COUNT, MAX_META_OVERALL_SIZE, \ + check_utf8 +from swift.common.utils import Timestamp, renamer, \ + mkdirs, lock_parent_directory, fallocate, md5 from swift.common.exceptions import LockTimeout +from swift.common.swob import HTTPBadRequest #: Whether calls will be made to preallocate disk space for database files. -DB_PREALLOCATION = True +DB_PREALLOCATION = False +#: Whether calls will be made to log queries (py3 only) +QUERY_LOGGING = False #: Timeout for trying to connect to a DB BROKER_TIMEOUT = 25 #: Pickle protocol to use PICKLE_PROTOCOL = 2 -#: Max number of pending entries +#: Max size of .pending file in bytes. When this is exceeded, the pending +# records will be merged. PENDING_CAP = 131072 +SQLITE_ARG_LIMIT = 999 +RECLAIM_PAGE_SIZE = 10000 -def utf8encode(*args): - return [(s.encode('utf8') if isinstance(s, unicode) else s) for s in args] + +def native_str_keys_and_values(metadata): + bin_keys = [k for k in metadata if isinstance(k, bytes)] + for k in bin_keys: + sv = metadata[k] + del metadata[k] + metadata[k.decode('utf-8')] = [ + x.decode('utf-8') if isinstance(x, bytes) else x + for x in sv] + + +ZERO_LIKE_VALUES = {None, '', 0, '0'} + + +def zero_like(count): + """ + We've cargo culted our consumers to be tolerant of various expressions of + zero in our databases for backwards compatibility with less disciplined + producers. 
+ """ + return count in ZERO_LIKE_VALUES + + +def _db_timeout(timeout, db_file, call): + with LockTimeout(timeout, db_file): + retry_wait = 0.001 + while True: + try: + return call() + except sqlite3.OperationalError as e: + if 'locked' not in str(e): + raise + sleep(retry_wait) + retry_wait = min(retry_wait * 2, 0.05) class DatabaseConnectionError(sqlite3.DatabaseError): @@ -63,31 +101,66 @@ def __str__(self): self.path, self.timeout, self.msg) +class DatabaseAlreadyExists(sqlite3.DatabaseError): + """More friendly error messages for DB Errors.""" + + def __init__(self, path): + self.path = path + + def __str__(self): + return 'DB %s already exists' % self.path + + class GreenDBConnection(sqlite3.Connection): """SQLite DB Connection handler that plays well with eventlet.""" + # slots are needed for python 3.11.0 (there's an issue fixed in 3.11.1, + # see https://github.com/python/cpython/issues/99886) + __slots__ = ('timeout', 'db_file') - def __init__(self, *args, **kwargs): - self.timeout = kwargs.get('timeout', BROKER_TIMEOUT) - kwargs['timeout'] = 0 - self.db_file = args and args[0] or '-' - sqlite3.Connection.__init__(self, *args, **kwargs) + def __init__(self, database, timeout=None, *args, **kwargs): + if timeout is None: + timeout = BROKER_TIMEOUT + self.timeout = timeout + self.db_file = database + super(GreenDBConnection, self).__init__( + database, timeout=0, *args, **kwargs) - def _timeout(self, call): - with LockTimeout(self.timeout, self.db_file): - while True: - try: - return call() - except sqlite3.OperationalError, e: - if 'locked' not in str(e): - raise - sleep(0.05) + def cursor(self, cls=None): + if cls is None: + cls = GreenDBCursor + return sqlite3.Connection.cursor(self, cls) def execute(self, *args, **kwargs): - return self._timeout(lambda: sqlite3.Connection.execute( - self, *args, **kwargs)) + # py311 stopped calling self.cursor() to get the cursor; + # see https://github.com/python/cpython/pull/31351 + curs = self.cursor() + curs.execute(*args, **kwargs) + return curs def commit(self): - return self._timeout(lambda: sqlite3.Connection.commit(self)) + return _db_timeout( + self.timeout, self.db_file, + lambda: sqlite3.Connection.commit(self)) + + +class GreenDBCursor(sqlite3.Cursor): + """SQLite Cursor handler that plays well with eventlet.""" + # slots are needed for python 3.11.0 (there's an issue fixed in 3.11.1, + # see https://github.com/python/cpython/issues/99886) + __slots__ = ('timeout', 'db_file') + + def __init__(self, *args, **kwargs): + self.timeout = args[0].timeout + self.db_file = args[0].db_file + super(GreenDBCursor, self).__init__(*args, **kwargs) + + def execute(self, *args, **kwargs): + return _db_timeout( + self.timeout, self.db_file, lambda: sqlite3.Cursor.execute( + self, *args, **kwargs)) + + # NB: executemany and executescript are *not* greened, and never have been + # (as far as I can tell) def dict_factory(crs, row): @@ -107,19 +180,18 @@ def chexor(old, name, timestamp): :param old: hex representation of the current DB hash :param name: name of the object or container being inserted - :param timestamp: timestamp of the new record - :returns: a hex representation of the new hash value + :param timestamp: a string representation of attributes of the item being + inserted, for example the string representation of the item's + timestamp. 
""" if name is None: raise Exception('name is None!') - old = old.decode('hex') - new = hashlib.md5(('%s-%s' % (name, timestamp)).encode('utf_8')).digest() - response = ''.join( - map(chr, map(operator.xor, map(ord, old), map(ord, new)))) - return response.encode('hex') + new = md5(('%s-%s' % (name, timestamp)).encode('utf8'), + usedforsecurity=False).hexdigest() + return '%032x' % (int(old, 16) ^ int(new, 16)) -def get_db_connection(path, timeout=30, okay_to_create=False): +def get_db_connection(path, timeout=30, logger=None, okay_to_create=False): """ Returns a properly configured SQLite database connection. @@ -132,7 +204,9 @@ def get_db_connection(path, timeout=30, okay_to_create=False): connect_time = time.time() conn = sqlite3.connect(path, check_same_thread=False, factory=GreenDBConnection, timeout=timeout) - if path != ':memory:' and not okay_to_create: + if QUERY_LOGGING and logger: + conn.set_trace_callback(logger.debug) + if not okay_to_create: # attempt to detect and fail when connect creates the db file stat = os.stat(path) if stat.st_size == 0 and stat.st_ctime >= connect_time: @@ -141,10 +215,11 @@ def get_db_connection(path, timeout=30, okay_to_create=False): 'DB file created by connect?') conn.row_factory = sqlite3.Row conn.text_factory = str - conn.execute('PRAGMA synchronous = NORMAL') - conn.execute('PRAGMA count_changes = OFF') - conn.execute('PRAGMA temp_store = MEMORY') - conn.execute('PRAGMA journal_mode = DELETE') + with closing(conn.cursor()) as cur: + cur.execute('PRAGMA synchronous = NORMAL') + cur.execute('PRAGMA count_changes = OFF') + cur.execute('PRAGMA temp_store = MEMORY') + cur.execute('PRAGMA journal_mode = DELETE') conn.create_function('chexor', 3, chexor) except sqlite3.DatabaseError: import traceback @@ -153,17 +228,111 @@ def get_db_connection(path, timeout=30, okay_to_create=False): return conn +class TombstoneReclaimer(object): + """Encapsulates reclamation of deleted rows in a database.""" + def __init__(self, broker, age_timestamp): + """ + Encapsulates reclamation of deleted rows in a database. + + :param broker: an instance of :class:`~swift.common.db.DatabaseBroker`. + :param age_timestamp: a float timestamp: tombstones older than this + time will be deleted. + """ + self.broker = broker + self.age_timestamp = age_timestamp + self.marker = '' + self.remaining_tombstones = self.reclaimed = 0 + self.finished = False + # limit 1 offset N gives back the N+1th matching row; that row is used + # as an exclusive end_marker for a batch of deletes, so a batch + # comprises rows satisfying self.marker <= name < end_marker. + self.batch_query = ''' + SELECT name FROM %s WHERE deleted = 1 + AND name >= ? + ORDER BY NAME LIMIT 1 OFFSET ? + ''' % self.broker.db_contains_type + self.clean_batch_query = ''' + DELETE FROM %s WHERE deleted = 1 + AND name >= ? 
AND %s < '%s' + ''' % (self.broker.db_contains_type, self.broker.db_reclaim_timestamp, + self.age_timestamp) + + def _reclaim(self, conn): + curs = conn.execute(self.batch_query, (self.marker, RECLAIM_PAGE_SIZE)) + row = curs.fetchone() + end_marker = row[0] if row else '' + if end_marker: + # do a single book-ended DELETE and bounce out + curs = conn.execute(self.clean_batch_query + ' AND name < ?', + (self.marker, end_marker)) + self.marker = end_marker + self.reclaimed += curs.rowcount + self.remaining_tombstones += RECLAIM_PAGE_SIZE - curs.rowcount + else: + # delete off the end + curs = conn.execute(self.clean_batch_query, (self.marker,)) + self.finished = True + self.reclaimed += curs.rowcount + + def reclaim(self): + """ + Perform reclaim of deleted rows older than ``age_timestamp``. + """ + while not self.finished: + with self.broker.get() as conn: + self._reclaim(conn) + conn.commit() + + def get_tombstone_count(self): + """ + Return the number of remaining tombstones newer than ``age_timestamp``. + Executes the ``reclaim`` method if it has not already been called on + this instance. + + :return: The number of tombstones in the ``broker`` that are newer than + ``age_timestamp``. + """ + if not self.finished: + self.reclaim() + with self.broker.get() as conn: + curs = conn.execute(''' + SELECT COUNT(*) FROM %s WHERE deleted = 1 + AND name >= ? + ''' % (self.broker.db_contains_type,), (self.marker,)) + tombstones = curs.fetchone()[0] + self.remaining_tombstones += tombstones + return self.remaining_tombstones + + class DatabaseBroker(object): """Encapsulates working with a database.""" + delete_meta_whitelist = [] + def __init__(self, db_file, timeout=BROKER_TIMEOUT, logger=None, - account=None, container=None, pending_timeout=10, - stale_reads_ok=False): - """ Encapsulates working with a database. """ + account=None, container=None, pending_timeout=None, + stale_reads_ok=False, skip_commits=False): + """Encapsulates working with a database. + + :param db_file: path to a database file. + :param timeout: timeout used for database operations. + :param logger: a logger instance. + :param account: name of account. + :param container: name of container. + :param pending_timeout: timeout used when attempting to take a lock to + write to pending file. + :param stale_reads_ok: if True then no error is raised if pending + commits cannot be committed before the database is read, otherwise + an error is raised. + :param skip_commits: if True then this broker instance will never + commit records from the pending file to the database; + :meth:`~swift.common.db.DatabaseBroker.put_record` should not + called on brokers with skip_commits True. + """ self.conn = None - self.db_file = db_file - self.pending_file = self.db_file + '.pending' - self.pending_timeout = pending_timeout + self._db_file = db_file + self.pending_file = self._db_file + '.pending' + self.pending_timeout = pending_timeout or 10 self.stale_reads_ok = stale_reads_ok self.db_dir = os.path.dirname(db_file) self.timeout = timeout @@ -171,27 +340,39 @@ def __init__(self, db_file, timeout=BROKER_TIMEOUT, logger=None, self.account = account self.container = container self._db_version = -1 + self.skip_commits = skip_commits + + def __str__(self): + """ + Returns a string identifying the entity under broker to a human. + The baseline implementation returns a full pathname to a database. + This is vital for useful diagnostics. 
+ """ + return self.db_file - def initialize(self, put_timestamp=None): + def initialize(self, put_timestamp=None, storage_policy_index=None): """ Create the DB - :param put_timestamp: timestamp of initial PUT request + The storage_policy_index is passed through to the subclass's + ``_initialize`` method. It is ignored by ``AccountBroker``. + + :param put_timestamp: internalized timestamp of initial PUT request + :param storage_policy_index: only required for containers """ - if self.db_file == ':memory:': - tmp_db_file = None - conn = get_db_connection(self.db_file, self.timeout) - else: - mkdirs(self.db_dir) - fd, tmp_db_file = mkstemp(suffix='.tmp', dir=self.db_dir) - os.close(fd) - conn = sqlite3.connect(tmp_db_file, check_same_thread=False, - factory=GreenDBConnection, timeout=0) + mkdirs(self.db_dir) + fd, tmp_db_file = mkstemp(suffix='.tmp', dir=self.db_dir) + os.close(fd) + conn = sqlite3.connect(tmp_db_file, check_same_thread=False, + factory=GreenDBConnection, timeout=0) + if QUERY_LOGGING: + conn.set_trace_callback(self.logger.debug) # creating dbs implicitly does a lot of transactions, so we # pick fast, unsafe options here and do a big fsync at the end. - conn.execute('PRAGMA synchronous = OFF') - conn.execute('PRAGMA temp_store = MEMORY') - conn.execute('PRAGMA journal_mode = MEMORY') + with closing(conn.cursor()) as cur: + cur.execute('PRAGMA synchronous = OFF') + cur.execute('PRAGMA temp_store = MEMORY') + cur.execute('PRAGMA journal_mode = MEMORY') conn.create_function('chexor', 3, chexor) conn.row_factory = sqlite3.Row conn.text_factory = str @@ -232,8 +413,9 @@ def initialize(self, put_timestamp=None): END; """) if not put_timestamp: - put_timestamp = normalize_timestamp(0) - self._initialize(conn, put_timestamp) + put_timestamp = Timestamp.zero().internal + self._initialize(conn, put_timestamp, + storage_policy_index=storage_policy_index) conn.commit() if tmp_db_file: conn.close() @@ -243,11 +425,10 @@ def initialize(self, put_timestamp=None): if os.path.exists(self.db_file): # It's as if there was a "condition" where different parts # of the system were "racing" each other. - raise DatabaseConnectionError( - self.db_file, - 'DB created by someone else while working?') + raise DatabaseAlreadyExists(self.db_file) renamer(tmp_db_file, self.db_file) - self.conn = get_db_connection(self.db_file, self.timeout) + self.conn = get_db_connection(self.db_file, self.timeout, + self.logger) else: self.conn = conn @@ -255,60 +436,114 @@ def delete_db(self, timestamp): """ Mark the DB as deleted - :param timestamp: delete timestamp + :param timestamp: internalized delete timestamp """ - timestamp = normalize_timestamp(timestamp) # first, clear the metadata cleared_meta = {} - for k in self.metadata.iterkeys(): + for k in self.metadata: + if k.lower() in self.delete_meta_whitelist: + continue cleared_meta[k] = ('', timestamp) self.update_metadata(cleared_meta) # then mark the db as deleted with self.get() as conn: - self._delete_db(conn, timestamp) + conn.execute( + """ + UPDATE %s_stat + SET delete_timestamp = ?, + status = 'DELETED', + status_changed_at = ? + WHERE delete_timestamp < ? 
""" % self.db_type, + (timestamp, timestamp, timestamp)) conn.commit() - def possibly_quarantine(self, exc_type, exc_value, exc_traceback): + @property + def db_file(self): + return self._db_file + + def get_device_path(self): + suffix_path = os.path.dirname(self.db_dir) + partition_path = os.path.dirname(suffix_path) + dbs_path = os.path.dirname(partition_path) + return os.path.dirname(dbs_path) + + def quarantine(self, reason): """ - Checks the exception info to see if it indicates a quarantine situation - (malformed or corrupted database). If not, the original exception will - be reraised. If so, the database will be quarantined and a new + The database will be quarantined and a sqlite3.DatabaseError will be raised indicating the action taken. """ - if 'database disk image is malformed' in str(exc_value): - exc_hint = 'malformed' - elif 'file is encrypted or is not a database' in str(exc_value): - exc_hint = 'corrupted' - else: - raise exc_type(*exc_value.args), None, exc_traceback - prefix_path = os.path.dirname(self.db_dir) - partition_path = os.path.dirname(prefix_path) - dbs_path = os.path.dirname(partition_path) - device_path = os.path.dirname(dbs_path) + device_path = self.get_device_path() quar_path = os.path.join(device_path, 'quarantined', self.db_type + 's', os.path.basename(self.db_dir)) try: - renamer(self.db_dir, quar_path) - except OSError, e: + renamer(self.db_dir, quar_path, fsync=False) + except OSError as e: if e.errno not in (errno.EEXIST, errno.ENOTEMPTY): raise quar_path = "%s-%s" % (quar_path, uuid4().hex) - renamer(self.db_dir, quar_path) - detail = _('Quarantined %s to %s due to %s database') % \ - (self.db_dir, quar_path, exc_hint) + renamer(self.db_dir, quar_path, fsync=False) + detail = ('Quarantined %(db_dir)s to %(quar_path)s due to ' + '%(reason)s') % {'db_dir': self.db_dir, + 'quar_path': quar_path, + 'reason': reason} self.logger.error(detail) raise sqlite3.DatabaseError(detail) + def possibly_quarantine(self, err): + """ + Checks the exception info to see if it indicates a quarantine situation + (malformed or corrupted database). If not, the original exception will + be reraised. If so, the database will be quarantined and a new + sqlite3.DatabaseError will be raised indicating the action taken. 
+ """ + if 'database disk image is malformed' in str(err): + exc_hint = 'malformed database' + elif 'malformed database schema' in str(err): + exc_hint = 'malformed database' + elif ' is not a database' in str(err): + # older versions said 'file is not a database' + # now 'file is encrypted or is not a database' + exc_hint = 'corrupted database' + elif 'disk I/O error' in str(err): + exc_hint = 'disk error while accessing database' + else: + raise err + + self.quarantine(exc_hint) + + @contextmanager + def updated_timeout(self, new_timeout): + """Use with "with" statement; updates ``timeout`` within the block.""" + old_timeout = self.timeout + try: + self.timeout = new_timeout + if self.conn: + self.conn.timeout = new_timeout + yield old_timeout + finally: + self.timeout = old_timeout + if self.conn: + self.conn.timeout = old_timeout + + @contextmanager + def maybe_get(self, conn): + if conn: + yield conn + else: + with self.get() as conn: + yield conn + @contextmanager def get(self): """Use with the "with" statement; returns a database connection.""" if not self.conn: - if self.db_file != ':memory:' and os.path.exists(self.db_file): + if os.path.exists(self.db_file): try: - self.conn = get_db_connection(self.db_file, self.timeout) - except (sqlite3.DatabaseError, DatabaseConnectionError): - self.possibly_quarantine(*sys.exc_info()) + self.conn = get_db_connection(self.db_file, self.timeout, + self.logger) + except (sqlite3.DatabaseError, DatabaseConnectionError) as e: + self.possibly_quarantine(e) else: raise DatabaseConnectionError(self.db_file, "DB doesn't exist") conn = self.conn @@ -317,12 +552,12 @@ def get(self): yield conn conn.rollback() self.conn = conn - except sqlite3.DatabaseError: + except sqlite3.DatabaseError as e: try: conn.close() - except: + except Exception: pass - self.possibly_quarantine(*sys.exc_info()) + self.possibly_quarantine(e) except (Exception, Timeout): conn.close() raise @@ -331,8 +566,9 @@ def get(self): def lock(self): """Use with the "with" statement; locks a database.""" if not self.conn: - if self.db_file != ':memory:' and os.path.exists(self.db_file): - self.conn = get_db_connection(self.db_file, self.timeout) + if os.path.exists(self.db_file): + self.conn = get_db_connection(self.db_file, self.timeout, + self.logger) else: raise DatabaseConnectionError(self.db_file, "DB doesn't exist") conn = self.conn @@ -342,16 +578,19 @@ def lock(self): conn.execute('BEGIN IMMEDIATE') try: yield True - except (Exception, Timeout): - pass - try: - conn.execute('ROLLBACK') - conn.isolation_level = orig_isolation_level - self.conn = conn - except (Exception, Timeout): - logging.exception( - _('Broker error trying to rollback locked connection')) - conn.close() + finally: + try: + conn.execute('ROLLBACK') + conn.isolation_level = orig_isolation_level + self.conn = conn + except (Exception, Timeout): + logging.exception( + 'Broker error trying to rollback locked connection') + conn.close() + + def _new_db_id(self): + device_name = os.path.basename(self.get_device_path()) + return "%s-%s" % (str(uuid4()), device_name) def newid(self, remote_id): """ @@ -362,7 +601,7 @@ def newid(self, remote_id): with self.get() as conn: row = conn.execute(''' UPDATE %s_stat SET id=? - ''' % self.db_type, (str(uuid4()),)) + ''' % self.db_type, (self._new_db_id(),)) row = conn.execute(''' SELECT ROWID FROM %s ORDER BY ROWID DESC LIMIT 1 ''' % self.db_contains_type).fetchone() @@ -378,6 +617,45 @@ def _newid(self, conn): # Override for additional work when receiving an rsynced db. 
pass + def _is_deleted(self, conn): + """ + Check if the database is considered deleted + + :param conn: database conn + + :returns: True if the DB is considered to be deleted, False otherwise + """ + raise NotImplementedError() + + def is_deleted(self): + """ + Check if the DB is considered to be deleted. + + :returns: True if the DB is considered to be deleted, False otherwise + """ + if not os.path.exists(self.db_file): + return True + self._commit_puts_stale_ok() + with self.get() as conn: + return self._is_deleted(conn) + + def empty(self): + """ + Check if the broker abstraction contains any undeleted records. + """ + raise NotImplementedError() + + def is_reclaimable(self, now, reclaim_age): + """ + Check if the broker abstraction is empty, and has been marked deleted + for at least a reclaim age. + """ + info = self.get_replication_info() + return (zero_like(info['count']) and + (Timestamp(now - reclaim_age) > + Timestamp(info['delete_timestamp']) > + Timestamp(info['put_timestamp']))) + def merge_timestamps(self, created_at, put_timestamp, delete_timestamp): """ Used in replication to handle updating timestamps. @@ -387,11 +665,16 @@ def merge_timestamps(self, created_at, put_timestamp, delete_timestamp): :param delete_timestamp: delete timestamp """ with self.get() as conn: + old_status = self._is_deleted(conn) conn.execute(''' UPDATE %s_stat SET created_at=MIN(?, created_at), put_timestamp=MAX(?, put_timestamp), delete_timestamp=MAX(?, delete_timestamp) ''' % self.db_type, (created_at, put_timestamp, delete_timestamp)) + if old_status != self._is_deleted(conn): + timestamp = Timestamp.now() + self._update_status_changed_at(conn, timestamp.internal) + conn.commit() def get_items_since(self, start, count): @@ -402,11 +685,7 @@ def get_items_since(self, start, count): :param count: number to get :returns: list of objects between start and end """ - try: - self._commit_puts() - except LockTimeout: - if not self.stale_reads_ok: - raise + self._commit_puts_stale_ok() with self.get() as conn: curs = conn.execute(''' SELECT * FROM %s WHERE ROWID > ? ORDER BY ROWID ASC LIMIT ? @@ -431,58 +710,179 @@ def get_sync(self, id, incoming=True): return -1 return row['sync_point'] - def get_syncs(self, incoming=True): + def get_syncs(self, incoming=True, include_timestamp=False): """ Get a serialized copy of the sync table. :param incoming: if True, get the last incoming sync, otherwise get the last outgoing sync - :returns: list of {'remote_id', 'sync_point'} + :param include_timestamp: If True include the updated_at timestamp + :returns: list of {'remote_id', 'sync_point'} or + {'remote_id', 'sync_point', 'updated_at'} + if include_timestamp is True. 
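# A plain-float restatement of the is_reclaimable() rule above: an empty DB
# can be reclaimed once it has been deleted for at least reclaim_age and the
# delete is newer than the last put.  Sample values are made up; the real
# method compares swift Timestamps taken from get_replication_info().
def is_reclaimable(info, now, reclaim_age):
    return (info['count'] == 0 and
            now - reclaim_age > info['delete_timestamp'] >
            info['put_timestamp'])


info = {'count': 0, 'put_timestamp': 1000.0, 'delete_timestamp': 2000.0}
assert is_reclaimable(info, now=2000.0 + 8 * 86400, reclaim_age=7 * 86400)
assert not is_reclaimable(info, now=2000.0 + 3600, reclaim_age=7 * 86400)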
""" with self.get() as conn: + columns = 'remote_id, sync_point' + if include_timestamp: + columns += ', updated_at' curs = conn.execute(''' - SELECT remote_id, sync_point FROM %s_sync - ''' % 'incoming' if incoming else 'outgoing') - result = [] - for row in curs: - result.append({'remote_id': row[0], 'sync_point': row[1]}) - return result + SELECT %s FROM %s_sync + ''' % (columns, 'incoming' if incoming else 'outgoing')) + curs.row_factory = dict_factory + return [r for r in curs] + + def get_max_row(self, table=None): + if not table: + table = self.db_contains_type + query = ''' + SELECT SQLITE_SEQUENCE.seq + FROM SQLITE_SEQUENCE + WHERE SQLITE_SEQUENCE.name == '%s' + LIMIT 1 + ''' % (table, ) + with self.get() as conn: + row = conn.execute(query).fetchone() + return row[0] if row else -1 def get_replication_info(self): """ Get information about the DB required for replication. - :returns: dict containing keys: hash, id, created_at, put_timestamp, - delete_timestamp, count, max_row, and metadata + :returns: dict containing keys from get_info plus max_row and metadata + + Note:: get_info's _count is translated to just + "count" and metadata is the raw string. """ - try: - self._commit_puts() - except LockTimeout: - if not self.stale_reads_ok: - raise - query_part1 = ''' - SELECT hash, id, created_at, put_timestamp, delete_timestamp, - %s_count AS count, - CASE WHEN SQLITE_SEQUENCE.seq IS NOT NULL - THEN SQLITE_SEQUENCE.seq ELSE -1 END AS max_row, ''' % \ - self.db_contains_type - query_part2 = ''' - FROM (%s_stat LEFT JOIN SQLITE_SEQUENCE - ON SQLITE_SEQUENCE.name == '%s') LIMIT 1 - ''' % (self.db_type, self.db_contains_type) + info = self.get_info() + info['count'] = info.pop('%s_count' % self.db_contains_type) + info['metadata'] = self.get_raw_metadata() + info['max_row'] = self.get_max_row() + return info + + def get_info(self): + self._commit_puts_stale_ok() with self.get() as conn: - try: - curs = conn.execute(query_part1 + 'metadata' + query_part2) - except sqlite3.OperationalError, err: - if 'no such column: metadata' not in str(err): - raise - curs = conn.execute(query_part1 + "'' as metadata" + - query_part2) + curs = conn.execute('SELECT * from %s_stat' % self.db_type) curs.row_factory = dict_factory return curs.fetchone() - def _commit_puts(self): - pass # stub to be overridden if need be + def put_record(self, record): + """ + Put a record into the DB. If the DB has an associated pending file with + space then the record is appended to that file and a commit to the DB + is deferred. If its pending file is full then the record will be + committed immediately. + + :param record: a record to be added to the DB. + :raises DatabaseConnectionError: if the DB file does not exist or if + ``skip_commits`` is True. + :raises LockTimeout: if a timeout occurs while waiting to take a lock + to write to the pending file. 
+ """ + if not os.path.exists(self.db_file): + raise DatabaseConnectionError(self.db_file, "DB doesn't exist") + if self.skip_commits: + raise DatabaseConnectionError(self.db_file, + 'commits not accepted') + with lock_parent_directory(self.pending_file, self.pending_timeout): + pending_size = 0 + try: + pending_size = os.path.getsize(self.pending_file) + except OSError as err: + if err.errno != errno.ENOENT: + raise + if pending_size > PENDING_CAP: + self._commit_puts([record]) + else: + with open(self.pending_file, 'a+b') as fp: + # Colons aren't used in base64 encoding; so they are our + # delimiter + fp.write(b':') + fp.write(base64.b64encode(pickle.dumps( + self.make_tuple_for_pickle(record), + protocol=PICKLE_PROTOCOL))) + fp.flush() + + def _skip_commit_puts(self): + return self.skip_commits or not os.path.exists(self.pending_file) + + def _commit_puts(self, item_list=None): + """ + Scan for .pending files and commit the found records by feeding them + to merge_items(). Assume that lock_parent_directory has already been + called. + + :param item_list: A list of items to commit in addition to .pending + """ + if self._skip_commit_puts(): + if item_list: + # this broker instance should not be used to commit records, + # but if it is then raise an error rather than quietly + # discarding the records in item_list. + raise DatabaseConnectionError(self.db_file, + 'commits not accepted') + return + if item_list is None: + item_list = [] + self._preallocate() + if not os.path.getsize(self.pending_file): + if item_list: + self.merge_items(item_list) + return + with open(self.pending_file, 'r+b') as fp: + for entry in fp.read().split(b':'): + if entry: + try: + data = pickle.loads(base64.b64decode(entry), + encoding='utf8') # nosec: B301 + self._commit_puts_load(item_list, data) + except Exception: + self.logger.exception( + 'Invalid pending entry %(file)s: %(entry)s', + {'file': self.pending_file, 'entry': entry}) + if item_list: + self.merge_items(item_list) + try: + os.ftruncate(fp.fileno(), 0) + except OSError as err: + if err.errno != errno.ENOENT: + raise + + def _commit_puts_stale_ok(self): + """ + Catch failures of _commit_puts() if broker is intended for + reading of stats, and thus does not care for pending updates. + """ + if self._skip_commit_puts(): + return + try: + with lock_parent_directory(self.pending_file, + self.pending_timeout): + self._commit_puts() + except (LockTimeout, sqlite3.OperationalError): + if not self.stale_reads_ok: + raise + + def _commit_puts_load(self, item_list, entry): + """ + Unmarshall the :param:entry tuple and append it to :param:item_list. + This is implemented by a particular broker to be compatible + with its :func:`merge_items`. + """ + raise NotImplementedError + + def merge_items(self, item_list, source=None): + """ + Save :param:item_list to the database. + """ + raise NotImplementedError + + def make_tuple_for_pickle(self, record): + """ + Turn this db record dict into the format this service uses for + pending pickles. + """ + raise NotImplementedError def merge_syncs(self, sync_points, incoming=True): """ @@ -515,7 +915,7 @@ def _preallocate(self): within 512k of a boundary, it allocates to the next boundary. Boundaries are 2m, 5m, 10m, 25m, 50m, then every 50m after. 
""" - if not DB_PREALLOCATION or self.db_file == ':memory:': + if not DB_PREALLOCATION: return MB = (1024 * 1024) @@ -537,6 +937,21 @@ def prealloc_points(): with open(self.db_file, 'rb+') as fp: fallocate(fp.fileno(), int(prealloc_size)) + def get_raw_metadata(self): + with self.get() as conn: + try: + row = conn.execute('SELECT metadata FROM %s_stat' % + self.db_type).fetchone() + if not row: + self.quarantine("missing row in %s_stat table" % + self.db_type) + metadata = row[0] + except sqlite3.OperationalError as err: + if 'no such column: metadata' not in str(err): + raise + metadata = '' + return metadata + @property def metadata(self): """ @@ -544,65 +959,151 @@ def metadata(self): are tuples of (value, timestamp) where the timestamp indicates when that key was set to that value. """ - with self.get() as conn: - try: - metadata = conn.execute('SELECT metadata FROM %s_stat' % - self.db_type).fetchone()[0] - except sqlite3.OperationalError, err: - if 'no such column: metadata' not in str(err): - raise - metadata = '' + metadata = self.get_raw_metadata() if metadata: metadata = json.loads(metadata) + native_str_keys_and_values(metadata) else: metadata = {} return metadata - def update_metadata(self, metadata_updates): + @staticmethod + def validate_metadata(metadata): + """ + Validates that metadata falls within acceptable limits. + + :param metadata: to be validated + :raises HTTPBadRequest: if MAX_META_COUNT or MAX_META_OVERALL_SIZE + is exceeded, or if metadata contains non-UTF-8 data + """ + meta_count = 0 + meta_size = 0 + for key, (value, timestamp) in metadata.items(): + if key and not check_utf8(key): + raise HTTPBadRequest('Metadata must be valid UTF-8') + if value and not check_utf8(value): + raise HTTPBadRequest('Metadata must be valid UTF-8') + key = key.lower() + if value and key.startswith(('x-account-meta-', + 'x-container-meta-')): + prefix = 'x-account-meta-' + if key.startswith('x-container-meta-'): + prefix = 'x-container-meta-' + key = key[len(prefix):] + meta_count = meta_count + 1 + meta_size = meta_size + len(key) + len(value) + if meta_count > MAX_META_COUNT: + raise HTTPBadRequest('Too many metadata items; max %d' + % MAX_META_COUNT) + if meta_size > MAX_META_OVERALL_SIZE: + raise HTTPBadRequest('Total metadata too large; max %d' + % MAX_META_OVERALL_SIZE) + + def update_metadata(self, metadata_updates, validate_metadata=False): """ Updates the metadata dict for the database. The metadata dict values - are tuples of (value, timestamp) where the timestamp indicates when - that key was set to that value. Key/values will only be overwritten if - the timestamp is newer. To delete a key, set its value to ('', - timestamp). These empty keys will eventually be removed by - :func:reclaim + are tuples of (value, timestamp) where the timestamp is an internalized + timestamp string that indicates when that key was set to that value. + Key/values will only be overwritten if the timestamp is newer. To + delete a key, set its value to ('', timestamp). 
These empty keys will + eventually be removed by :func:`reclaim` """ old_metadata = self.metadata if set(metadata_updates).issubset(set(old_metadata)): - for key, (value, timestamp) in metadata_updates.iteritems(): + for key, (value, timestamp) in metadata_updates.items(): if timestamp > old_metadata[key][1]: break else: return with self.get() as conn: try: - md = conn.execute('SELECT metadata FROM %s_stat' % - self.db_type).fetchone()[0] - md = md and json.loads(md) or {} - except sqlite3.OperationalError, err: + row = conn.execute('SELECT metadata FROM %s_stat' % + self.db_type).fetchone() + if not row: + self.quarantine("missing row in %s_stat table" % + self.db_type) + md = row[0] + md = json.loads(md) if md else {} + native_str_keys_and_values(md) + except sqlite3.OperationalError as err: if 'no such column: metadata' not in str(err): raise conn.execute(""" ALTER TABLE %s_stat ADD COLUMN metadata TEXT DEFAULT '' """ % self.db_type) md = {} - for key, value_timestamp in metadata_updates.iteritems(): + for key, value_timestamp in metadata_updates.items(): value, timestamp = value_timestamp if key not in md or timestamp > md[key][1]: md[key] = value_timestamp + if validate_metadata: + DatabaseBroker.validate_metadata(md) conn.execute('UPDATE %s_stat SET metadata = ?' % self.db_type, (json.dumps(md),)) conn.commit() - def reclaim(self, timestamp): - """Removes any empty metadata values older than the timestamp""" - if not self.metadata: - return + def reclaim(self, age_timestamp, sync_timestamp): + """ + Delete reclaimable rows and metadata from the db. + + By default this method will delete rows from the db_contains_type table + that are marked deleted and whose created_at timestamp is < + age_timestamp, and deletes rows from incoming_sync and outgoing_sync + where the updated_at timestamp is < sync_timestamp. In addition, this + calls the :meth:`_reclaim_metadata` method. + + Subclasses may reclaim other items by overriding :meth:`_reclaim`. + + :param age_timestamp: (float) the max created_at timestamp of object + rows to delete + :param sync_timestamp: (float) the max update_at timestamp of sync rows + to delete + """ + if not self._skip_commit_puts(): + with lock_parent_directory(self.pending_file, + self.pending_timeout): + self._commit_puts() + + tombstone_reclaimer = TombstoneReclaimer(self, age_timestamp) + tombstone_reclaimer.reclaim() with self.get() as conn: - if self._reclaim(conn, timestamp): - conn.commit() + self._reclaim_other_stuff(conn, age_timestamp, sync_timestamp) + conn.commit() + return tombstone_reclaimer + + def _reclaim_other_stuff(self, conn, age_timestamp, sync_timestamp): + """ + This is only called once at the end of reclaim after tombstone reclaim + has been completed. + + :param conn: db connection + :param age_timestamp: (float) the max created_at timestamp of object + rows to delete + :param sync_timestamp: (float) the max update_at timestamp of sync rows + to delete + """ + self._reclaim_sync(conn, sync_timestamp) + self._reclaim_metadata(conn, age_timestamp) - def _reclaim(self, conn, timestamp): + def _reclaim_sync(self, conn, sync_timestamp): + """ + :param conn: db connection + :param sync_timestamp: (float) the max update_at timestamp of sync rows + to delete + """ + try: + conn.execute(''' + DELETE FROM outgoing_sync WHERE updated_at < ? + ''', (sync_timestamp,)) + conn.execute(''' + DELETE FROM incoming_sync WHERE updated_at < ? 
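# A plain-dict sketch of the metadata rules described above: every key maps
# to (value, timestamp), newer timestamps win on update, and a key is
# "deleted" by writing an empty value that a later reclaim drops.  The
# timestamps are simplified to bare internalized strings.
def merge_metadata(md, updates):
    for key, (value, timestamp) in updates.items():
        if key not in md or timestamp > md[key][1]:
            md[key] = (value, timestamp)
    return md


def reclaim_metadata(md, age_timestamp):
    return {k: v for k, v in md.items()
            if not (v[0] == '' and v[1] < age_timestamp)}


md = {'X-Container-Meta-Color': ('blue', '0000000001.00000')}
md = merge_metadata(
    md, {'X-Container-Meta-Color': ('', '0000000002.00000')})
print(reclaim_metadata(md, '0000000003.00000'))   # -> {}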
+ ''', (sync_timestamp,)) + except sqlite3.OperationalError as err: + # Old dbs didn't have updated_at in the _sync tables. + if 'no such column: updated_at' not in str(err): + raise + + def _reclaim_metadata(self, conn, timestamp): """ Removes any empty metadata values older than the timestamp using the given database connection. This function will not call commit on the @@ -611,18 +1112,23 @@ def _reclaim(self, conn, timestamp): from other related functions. :param conn: Database connection to reclaim metadata within. - :param timestamp: Empty metadata items last updated before this + :param timestamp: (float) Empty metadata items last updated before this timestamp will be removed. :returns: True if conn.commit() should be called """ + timestamp = Timestamp(timestamp) try: - md = conn.execute('SELECT metadata FROM %s_stat' % - self.db_type).fetchone()[0] + row = conn.execute('SELECT metadata FROM %s_stat' % + self.db_type).fetchone() + if not row: + self.quarantine("missing row in %s_stat table" % + self.db_type) + md = row[0] if md: md = json.loads(md) keys_to_delete = [] - for key, (value, value_timestamp) in md.iteritems(): - if value == '' and value_timestamp < timestamp: + for key, (value, value_timestamp) in md.items(): + if value == '' and Timestamp(value_timestamp) < timestamp: keys_to_delete.append(key) if keys_to_delete: for key in keys_to_delete: @@ -630,1061 +1136,39 @@ def _reclaim(self, conn, timestamp): conn.execute('UPDATE %s_stat SET metadata = ?' % self.db_type, (json.dumps(md),)) return True - except sqlite3.OperationalError, err: + except sqlite3.OperationalError as err: if 'no such column: metadata' not in str(err): raise return False - -class ContainerBroker(DatabaseBroker): - """Encapsulates working with a container database.""" - db_type = 'container' - db_contains_type = 'object' - - def _initialize(self, conn, put_timestamp): - """Creates a brand new database (tables, indices, triggers, etc.)""" - if not self.account: - raise ValueError( - 'Attempting to create a new database with no account set') - if not self.container: - raise ValueError( - 'Attempting to create a new database with no container set') - self.create_object_table(conn) - self.create_container_stat_table(conn, put_timestamp) - - def create_object_table(self, conn): - """ - Create the object table which is specifc to the container DB. - - :param conn: DB connection object - """ - conn.executescript(""" - CREATE TABLE object ( - ROWID INTEGER PRIMARY KEY AUTOINCREMENT, - name TEXT, - created_at TEXT, - size INTEGER, - content_type TEXT, - etag TEXT, - deleted INTEGER DEFAULT 0 - ); - - CREATE INDEX ix_object_deleted_name ON object (deleted, name); - - CREATE TRIGGER object_insert AFTER INSERT ON object - BEGIN - UPDATE container_stat - SET object_count = object_count + (1 - new.deleted), - bytes_used = bytes_used + new.size, - hash = chexor(hash, new.name, new.created_at); - END; - - CREATE TRIGGER object_update BEFORE UPDATE ON object - BEGIN - SELECT RAISE(FAIL, 'UPDATE not allowed; DELETE and INSERT'); - END; - - CREATE TRIGGER object_delete AFTER DELETE ON object - BEGIN - UPDATE container_stat - SET object_count = object_count - (1 - old.deleted), - bytes_used = bytes_used - old.size, - hash = chexor(hash, old.name, old.created_at); - END; - """) - - def create_container_stat_table(self, conn, put_timestamp=None): - """ - Create the container_stat table which is specific to the container DB. 
- - :param conn: DB connection object - :param put_timestamp: put timestamp - """ - if put_timestamp is None: - put_timestamp = normalize_timestamp(0) - conn.executescript(""" - CREATE TABLE container_stat ( - account TEXT, - container TEXT, - created_at TEXT, - put_timestamp TEXT DEFAULT '0', - delete_timestamp TEXT DEFAULT '0', - object_count INTEGER, - bytes_used INTEGER, - reported_put_timestamp TEXT DEFAULT '0', - reported_delete_timestamp TEXT DEFAULT '0', - reported_object_count INTEGER DEFAULT 0, - reported_bytes_used INTEGER DEFAULT 0, - hash TEXT default '00000000000000000000000000000000', - id TEXT, - status TEXT DEFAULT '', - status_changed_at TEXT DEFAULT '0', - metadata TEXT DEFAULT '', - x_container_sync_point1 INTEGER DEFAULT -1, - x_container_sync_point2 INTEGER DEFAULT -1 - ); - - INSERT INTO container_stat (object_count, bytes_used) - VALUES (0, 0); - """) - conn.execute(''' - UPDATE container_stat - SET account = ?, container = ?, created_at = ?, id = ?, - put_timestamp = ? - ''', (self.account, self.container, normalize_timestamp(time.time()), - str(uuid4()), put_timestamp)) - - def get_db_version(self, conn): - if self._db_version == -1: - self._db_version = 0 - for row in conn.execute(''' - SELECT name FROM sqlite_master - WHERE name = 'ix_object_deleted_name' '''): - self._db_version = 1 - return self._db_version - - def _newid(self, conn): - conn.execute(''' - UPDATE container_stat - SET reported_put_timestamp = 0, reported_delete_timestamp = 0, - reported_object_count = 0, reported_bytes_used = 0''') - def update_put_timestamp(self, timestamp): """ Update the put_timestamp. Only modifies it if it is greater than the current timestamp. - :param timestamp: put timestamp + :param timestamp: internalized put timestamp """ with self.get() as conn: - conn.execute(''' - UPDATE container_stat SET put_timestamp = ? - WHERE put_timestamp < ? ''', (timestamp, timestamp)) + conn.execute( + 'UPDATE %s_stat SET put_timestamp = ?' + ' WHERE put_timestamp < ?' % self.db_type, + (timestamp, timestamp)) conn.commit() - def _delete_db(self, conn, timestamp): + def update_status_changed_at(self, timestamp): """ - Mark the DB as deleted + Update the status_changed_at field in the stat table. Only + modifies status_changed_at if the timestamp is greater than the + current status_changed_at timestamp. - :param conn: DB connection object - :param timestamp: timestamp to mark as deleted + :param timestamp: internalized timestamp """ - conn.execute(""" - UPDATE container_stat - SET delete_timestamp = ?, - status = 'DELETED', - status_changed_at = ? - WHERE delete_timestamp < ? """, (timestamp, timestamp, timestamp)) - - def empty(self): - """ - Check if the DB is empty. 
- - :returns: True if the database has no active objects, False otherwise - """ - try: - self._commit_puts() - except LockTimeout: - if not self.stale_reads_ok: - raise with self.get() as conn: - row = conn.execute( - 'SELECT object_count from container_stat').fetchone() - return (row[0] == 0) - - def _commit_puts(self, item_list=None): - """Handles commiting rows in .pending files.""" - if self.db_file == ':memory:' or not os.path.exists(self.pending_file): - return - if item_list is None: - item_list = [] - with lock_parent_directory(self.pending_file, self.pending_timeout): - self._preallocate() - if not os.path.getsize(self.pending_file): - if item_list: - self.merge_items(item_list) - return - with open(self.pending_file, 'r+b') as fp: - for entry in fp.read().split(':'): - if entry: - try: - (name, timestamp, size, content_type, etag, - deleted) = pickle.loads(entry.decode('base64')) - item_list.append({'name': name, - 'created_at': timestamp, - 'size': size, - 'content_type': content_type, - 'etag': etag, - 'deleted': deleted}) - except Exception: - self.logger.exception( - _('Invalid pending entry %(file)s: %(entry)s'), - {'file': self.pending_file, 'entry': entry}) - if item_list: - self.merge_items(item_list) - try: - os.ftruncate(fp.fileno(), 0) - except OSError, err: - if err.errno != errno.ENOENT: - raise - - def reclaim(self, object_timestamp, sync_timestamp): - """ - Delete rows from the object table that are marked deleted and - whose created_at timestamp is < object_timestamp. Also deletes rows - from incoming_sync and outgoing_sync where the updated_at timestamp is - < sync_timestamp. - - In addition, this calls the DatabaseBroker's :func:_reclaim method. - - :param object_timestamp: max created_at timestamp of object rows to - delete - :param sync_timestamp: max update_at timestamp of sync rows to delete - """ - self._commit_puts() - with self.get() as conn: - conn.execute(""" - DELETE FROM object - WHERE deleted = 1 - AND created_at < ?""", (object_timestamp,)) - try: - conn.execute(''' - DELETE FROM outgoing_sync WHERE updated_at < ? - ''', (sync_timestamp,)) - conn.execute(''' - DELETE FROM incoming_sync WHERE updated_at < ? - ''', (sync_timestamp,)) - except sqlite3.OperationalError, err: - # Old dbs didn't have updated_at in the _sync tables. - if 'no such column: updated_at' not in str(err): - raise - DatabaseBroker._reclaim(self, conn, object_timestamp) - conn.commit() - - def delete_object(self, name, timestamp): - """ - Mark an object deleted. - - :param name: object name to be deleted - :param timestamp: timestamp when the object was marked as deleted - """ - self.put_object(name, timestamp, 0, 'application/deleted', 'noetag', 1) - - def put_object(self, name, timestamp, size, content_type, etag, deleted=0): - """ - Creates an object in the DB with its metadata. 
- - :param name: object name to be created - :param timestamp: timestamp of when the object was created - :param size: object size - :param content_type: object content-type - :param etag: object etag - :param deleted: if True, marks the object as deleted and sets the - deteleted_at timestamp to timestamp - """ - record = {'name': name, 'created_at': timestamp, 'size': size, - 'content_type': content_type, 'etag': etag, - 'deleted': deleted} - if self.db_file == ':memory:': - self.merge_items([record]) - return - if not os.path.exists(self.db_file): - raise DatabaseConnectionError(self.db_file, "DB doesn't exist") - pending_size = 0 - try: - pending_size = os.path.getsize(self.pending_file) - except OSError, err: - if err.errno != errno.ENOENT: - raise - if pending_size > PENDING_CAP: - self._commit_puts([record]) - else: - with lock_parent_directory( - self.pending_file, self.pending_timeout): - with open(self.pending_file, 'a+b') as fp: - # Colons aren't used in base64 encoding; so they are our - # delimiter - fp.write(':') - fp.write(pickle.dumps( - (name, timestamp, size, content_type, etag, deleted), - protocol=PICKLE_PROTOCOL).encode('base64')) - fp.flush() - - def is_deleted(self, timestamp=None): - """ - Check if the DB is considered to be deleted. - - :returns: True if the DB is considered to be deleted, False otherwise - """ - if self.db_file != ':memory:' and not os.path.exists(self.db_file): - return True - try: - self._commit_puts() - except LockTimeout: - if not self.stale_reads_ok: - raise - with self.get() as conn: - row = conn.execute(''' - SELECT put_timestamp, delete_timestamp, object_count - FROM container_stat''').fetchone() - # leave this db as a tombstone for a consistency window - if timestamp and row['delete_timestamp'] > timestamp: - return False - # The container is considered deleted if the delete_timestamp - # value is greater than the put_timestamp, and there are no - # objects in the container. - return (row['object_count'] in (None, '', 0, '0')) and \ - (float(row['delete_timestamp']) > float(row['put_timestamp'])) - - def get_info(self, include_metadata=False): - """ - Get global data for the container. - - :returns: dict with keys: account, container, created_at, - put_timestamp, delete_timestamp, object_count, bytes_used, - reported_put_timestamp, reported_delete_timestamp, - reported_object_count, reported_bytes_used, hash, id, - x_container_sync_point1, and x_container_sync_point2. 
- If include_metadata is set, metadata is included as a key - pointing to a dict of tuples of the metadata - """ - try: - self._commit_puts() - except LockTimeout: - if not self.stale_reads_ok: - raise - with self.get() as conn: - data = None - trailing1 = 'metadata' - trailing2 = 'x_container_sync_point1, x_container_sync_point2' - while not data: - try: - data = conn.execute(''' - SELECT account, container, created_at, put_timestamp, - delete_timestamp, object_count, bytes_used, - reported_put_timestamp, reported_delete_timestamp, - reported_object_count, reported_bytes_used, hash, - id, %s, %s - FROM container_stat - ''' % (trailing1, trailing2)).fetchone() - except sqlite3.OperationalError, err: - if 'no such column: metadata' in str(err): - trailing1 = "'' as metadata" - elif 'no such column: x_container_sync_point' in str(err): - trailing2 = '-1 AS x_container_sync_point1, ' \ - '-1 AS x_container_sync_point2' - else: - raise - data = dict(data) - if include_metadata: - try: - data['metadata'] = json.loads(data.get('metadata', '')) - except ValueError: - data['metadata'] = {} - elif 'metadata' in data: - del data['metadata'] - return data - - def set_x_container_sync_points(self, sync_point1, sync_point2): - with self.get() as conn: - orig_isolation_level = conn.isolation_level - try: - # We turn off auto-transactions to ensure the alter table - # commands are part of the transaction. - conn.isolation_level = None - conn.execute('BEGIN') - try: - self._set_x_container_sync_points(conn, sync_point1, - sync_point2) - except sqlite3.OperationalError, err: - if 'no such column: x_container_sync_point' not in \ - str(err): - raise - conn.execute(''' - ALTER TABLE container_stat - ADD COLUMN x_container_sync_point1 INTEGER DEFAULT -1 - ''') - conn.execute(''' - ALTER TABLE container_stat - ADD COLUMN x_container_sync_point2 INTEGER DEFAULT -1 - ''') - self._set_x_container_sync_points(conn, sync_point1, - sync_point2) - conn.execute('COMMIT') - finally: - conn.isolation_level = orig_isolation_level - - def _set_x_container_sync_points(self, conn, sync_point1, sync_point2): - if sync_point1 is not None and sync_point2 is not None: - conn.execute(''' - UPDATE container_stat - SET x_container_sync_point1 = ?, - x_container_sync_point2 = ? - ''', (sync_point1, sync_point2)) - elif sync_point1 is not None: - conn.execute(''' - UPDATE container_stat - SET x_container_sync_point1 = ? - ''', (sync_point1,)) - elif sync_point2 is not None: - conn.execute(''' - UPDATE container_stat - SET x_container_sync_point2 = ? - ''', (sync_point2,)) - - def reported(self, put_timestamp, delete_timestamp, object_count, - bytes_used): - """ - Update reported stats. - - :param put_timestamp: put_timestamp to update - :param delete_timestamp: delete_timestamp to update - :param object_count: object_count to update - :param bytes_used: bytes_used to update - """ - with self.get() as conn: - conn.execute(''' - UPDATE container_stat - SET reported_put_timestamp = ?, reported_delete_timestamp = ?, - reported_object_count = ?, reported_bytes_used = ? - ''', (put_timestamp, delete_timestamp, object_count, bytes_used)) - conn.commit() - - def list_objects_iter(self, limit, marker, end_marker, prefix, delimiter, - path=None): - """ - Get a list of objects sorted by name starting at marker onward, up - to limit entries. Entries will begin with the prefix and will not - have the delimiter after the prefix. 
- - :param limit: maximum number of entries to get - :param marker: marker query - :param end_marker: end marker query - :param prefix: prefix query - :param delimeter: delimeter for query - :param path: if defined, will set the prefix and delimter based on - the path - - :returns: list of tuples of (name, created_at, size, content_type, - etag) - """ - (marker, end_marker, prefix, delimiter, path) = utf8encode( - marker, end_marker, prefix, delimiter, path) - try: - self._commit_puts() - except LockTimeout: - if not self.stale_reads_ok: - raise - if path is not None: - prefix = path - if path: - prefix = path = path.rstrip('/') + '/' - delimiter = '/' - elif delimiter and not prefix: - prefix = '' - orig_marker = marker - with self.get() as conn: - results = [] - while len(results) < limit: - query = '''SELECT name, created_at, size, content_type, etag - FROM object WHERE''' - query_args = [] - if end_marker: - query += ' name < ? AND' - query_args.append(end_marker) - if marker and marker >= prefix: - query += ' name > ? AND' - query_args.append(marker) - elif prefix: - query += ' name >= ? AND' - query_args.append(prefix) - if self.get_db_version(conn) < 1: - query += ' +deleted = 0' - else: - query += ' deleted = 0' - query += ' ORDER BY name LIMIT ?' - query_args.append(limit - len(results)) - curs = conn.execute(query, query_args) - curs.row_factory = None - - if prefix is None: - return [r for r in curs] - if not delimiter: - return [r for r in curs if r[0].startswith(prefix)] - rowcount = 0 - for row in curs: - rowcount += 1 - marker = name = row[0] - if len(results) >= limit or not name.startswith(prefix): - curs.close() - return results - end = name.find(delimiter, len(prefix)) - if path is not None: - if name == path: - continue - if end >= 0 and len(name) > end + len(delimiter): - marker = name[:end] + chr(ord(delimiter) + 1) - curs.close() - break - elif end > 0: - marker = name[:end] + chr(ord(delimiter) + 1) - dir_name = name[:end + 1] - if dir_name != orig_marker: - results.append([dir_name, '0', 0, None, '']) - curs.close() - break - results.append(row) - if not rowcount: - break - return results - - def merge_items(self, item_list, source=None): - """ - Merge items into the object table. - - :param item_list: list of dictionaries of {'name', 'created_at', - 'size', 'content_type', 'etag', 'deleted'} - :param source: if defined, update incoming_sync with the source - """ - with self.get() as conn: - max_rowid = -1 - for rec in item_list: - query = ''' - DELETE FROM object - WHERE name = ? AND (created_at < ?) - ''' - if self.get_db_version(conn) >= 1: - query += ' AND deleted IN (0, 1)' - conn.execute(query, (rec['name'], rec['created_at'])) - query = 'SELECT 1 FROM object WHERE name = ?' - if self.get_db_version(conn) >= 1: - query += ' AND deleted IN (0, 1)' - if not conn.execute(query, (rec['name'],)).fetchall(): - conn.execute(''' - INSERT INTO object (name, created_at, size, - content_type, etag, deleted) - VALUES (?, ?, ?, ?, ?, ?) - ''', ([rec['name'], rec['created_at'], rec['size'], - rec['content_type'], rec['etag'], rec['deleted']])) - if source: - max_rowid = max(max_rowid, rec['ROWID']) - if source: - try: - conn.execute(''' - INSERT INTO incoming_sync (sync_point, remote_id) - VALUES (?, ?) - ''', (max_rowid, source)) - except sqlite3.IntegrityError: - conn.execute(''' - UPDATE incoming_sync SET sync_point=max(?, sync_point) - WHERE remote_id=? 
- ''', (max_rowid, source)) - conn.commit() - - -class AccountBroker(DatabaseBroker): - """Encapsulates working with a account database.""" - db_type = 'account' - db_contains_type = 'container' - - def _initialize(self, conn, put_timestamp): - """ - Create a brand new database (tables, indices, triggers, etc.) - - :param conn: DB connection object - :param put_timestamp: put timestamp - """ - if not self.account: - raise ValueError( - 'Attempting to create a new database with no account set') - self.create_container_table(conn) - self.create_account_stat_table(conn, put_timestamp) - - def create_container_table(self, conn): - """ - Create container table which is specific to the account DB. - - :param conn: DB connection object - """ - conn.executescript(""" - CREATE TABLE container ( - ROWID INTEGER PRIMARY KEY AUTOINCREMENT, - name TEXT, - put_timestamp TEXT, - delete_timestamp TEXT, - object_count INTEGER, - bytes_used INTEGER, - deleted INTEGER DEFAULT 0 - ); - - CREATE INDEX ix_container_deleted_name ON - container (deleted, name); - - CREATE TRIGGER container_insert AFTER INSERT ON container - BEGIN - UPDATE account_stat - SET container_count = container_count + (1 - new.deleted), - object_count = object_count + new.object_count, - bytes_used = bytes_used + new.bytes_used, - hash = chexor(hash, new.name, - new.put_timestamp || '-' || - new.delete_timestamp || '-' || - new.object_count || '-' || new.bytes_used); - END; - - CREATE TRIGGER container_update BEFORE UPDATE ON container - BEGIN - SELECT RAISE(FAIL, 'UPDATE not allowed; DELETE and INSERT'); - END; - - - CREATE TRIGGER container_delete AFTER DELETE ON container - BEGIN - UPDATE account_stat - SET container_count = container_count - (1 - old.deleted), - object_count = object_count - old.object_count, - bytes_used = bytes_used - old.bytes_used, - hash = chexor(hash, old.name, - old.put_timestamp || '-' || - old.delete_timestamp || '-' || - old.object_count || '-' || old.bytes_used); - END; - """) - - def create_account_stat_table(self, conn, put_timestamp): - """ - Create account_stat table which is specific to the account DB. - - :param conn: DB connection object - :param put_timestamp: put timestamp - """ - conn.executescript(""" - CREATE TABLE account_stat ( - account TEXT, - created_at TEXT, - put_timestamp TEXT DEFAULT '0', - delete_timestamp TEXT DEFAULT '0', - container_count INTEGER, - object_count INTEGER DEFAULT 0, - bytes_used INTEGER DEFAULT 0, - hash TEXT default '00000000000000000000000000000000', - id TEXT, - status TEXT DEFAULT '', - status_changed_at TEXT DEFAULT '0', - metadata TEXT DEFAULT '' - ); - - INSERT INTO account_stat (container_count) VALUES (0); - """) - - conn.execute(''' - UPDATE account_stat SET account = ?, created_at = ?, id = ?, - put_timestamp = ? - ''', (self.account, normalize_timestamp(time.time()), str(uuid4()), - put_timestamp)) - - def get_db_version(self, conn): - if self._db_version == -1: - self._db_version = 0 - for row in conn.execute(''' - SELECT name FROM sqlite_master - WHERE name = 'ix_container_deleted_name' '''): - self._db_version = 1 - return self._db_version - - def update_put_timestamp(self, timestamp): - """ - Update the put_timestamp. Only modifies it if it is greater than - the current timestamp. - - :param timestamp: put timestamp - """ - with self.get() as conn: - conn.execute(''' - UPDATE account_stat SET put_timestamp = ? - WHERE put_timestamp < ? 
''', (timestamp, timestamp)) + self._update_status_changed_at(conn, timestamp) conn.commit() - def _delete_db(self, conn, timestamp, force=False): - """ - Mark the DB as deleted. - - :param conn: DB connection object - :param timestamp: timestamp to mark as deleted - """ - conn.execute(""" - UPDATE account_stat - SET delete_timestamp = ?, - status = 'DELETED', - status_changed_at = ? - WHERE delete_timestamp < ? """, (timestamp, timestamp, timestamp)) - - def _commit_puts(self, item_list=None): - """Handles commiting rows in .pending files.""" - if self.db_file == ':memory:' or not os.path.exists(self.pending_file): - return - if item_list is None: - item_list = [] - with lock_parent_directory(self.pending_file, self.pending_timeout): - self._preallocate() - if not os.path.getsize(self.pending_file): - if item_list: - self.merge_items(item_list) - return - with open(self.pending_file, 'r+b') as fp: - for entry in fp.read().split(':'): - if entry: - try: - (name, put_timestamp, delete_timestamp, - object_count, bytes_used, deleted) = \ - pickle.loads(entry.decode('base64')) - item_list.append( - {'name': name, - 'put_timestamp': put_timestamp, - 'delete_timestamp': delete_timestamp, - 'object_count': object_count, - 'bytes_used': bytes_used, - 'deleted': deleted}) - except Exception: - self.logger.exception( - _('Invalid pending entry %(file)s: %(entry)s'), - {'file': self.pending_file, 'entry': entry}) - if item_list: - self.merge_items(item_list) - try: - os.ftruncate(fp.fileno(), 0) - except OSError, err: - if err.errno != errno.ENOENT: - raise - - def empty(self): - """ - Check if the account DB is empty. - - :returns: True if the database has no active containers. - """ - try: - self._commit_puts() - except LockTimeout: - if not self.stale_reads_ok: - raise - with self.get() as conn: - row = conn.execute( - 'SELECT container_count from account_stat').fetchone() - return (row[0] == 0) - - def reclaim(self, container_timestamp, sync_timestamp): - """ - Delete rows from the container table that are marked deleted and - whose created_at timestamp is < container_timestamp. Also deletes rows - from incoming_sync and outgoing_sync where the updated_at timestamp is - < sync_timestamp. - - In addition, this calls the DatabaseBroker's :func:_reclaim method. - - :param container_timestamp: max created_at timestamp of container rows - to delete - :param sync_timestamp: max update_at timestamp of sync rows to delete - """ - - self._commit_puts() - with self.get() as conn: - conn.execute(''' - DELETE FROM container WHERE - deleted = 1 AND delete_timestamp < ? - ''', (container_timestamp,)) - try: - conn.execute(''' - DELETE FROM outgoing_sync WHERE updated_at < ? - ''', (sync_timestamp,)) - conn.execute(''' - DELETE FROM incoming_sync WHERE updated_at < ? - ''', (sync_timestamp,)) - except sqlite3.OperationalError, err: - # Old dbs didn't have updated_at in the _sync tables. - if 'no such column: updated_at' not in str(err): - raise - DatabaseBroker._reclaim(self, conn, container_timestamp) - conn.commit() - - def get_container_timestamp(self, container_name): - """ - Get the put_timestamp of a container. - - :param container_name: container name - - :returns: put_timestamp of the container - """ - try: - self._commit_puts() - except LockTimeout: - if not self.stale_reads_ok: - raise - with self.get() as conn: - ret = conn.execute(''' - SELECT put_timestamp FROM container - WHERE name = ? 
AND deleted != 1''', - (container_name,)).fetchone() - if ret: - ret = ret[0] - return ret - - def put_container(self, name, put_timestamp, delete_timestamp, - object_count, bytes_used): - """ - Create a container with the given attributes. - - :param name: name of the container to create - :param put_timestamp: put_timestamp of the container to create - :param delete_timestamp: delete_timestamp of the container to create - :param object_count: number of objects in the container - :param bytes_used: number of bytes used by the container - """ - if delete_timestamp > put_timestamp and \ - object_count in (None, '', 0, '0'): - deleted = 1 - else: - deleted = 0 - record = {'name': name, 'put_timestamp': put_timestamp, - 'delete_timestamp': delete_timestamp, - 'object_count': object_count, - 'bytes_used': bytes_used, - 'deleted': deleted} - if self.db_file == ':memory:': - self.merge_items([record]) - return - if not os.path.exists(self.db_file): - raise DatabaseConnectionError(self.db_file, "DB doesn't exist") - pending_size = 0 - try: - pending_size = os.path.getsize(self.pending_file) - except OSError, err: - if err.errno != errno.ENOENT: - raise - if pending_size > PENDING_CAP: - self._commit_puts([record]) - else: - with lock_parent_directory(self.pending_file, - self.pending_timeout): - with open(self.pending_file, 'a+b') as fp: - # Colons aren't used in base64 encoding; so they are our - # delimiter - fp.write(':') - fp.write(pickle.dumps( - (name, put_timestamp, delete_timestamp, object_count, - bytes_used, deleted), - protocol=PICKLE_PROTOCOL).encode('base64')) - fp.flush() - - def can_delete_db(self, cutoff): - """ - Check if the accont DB can be deleted. - - :returns: True if the account can be deleted, False otherwise - """ - self._commit_puts() - with self.get() as conn: - row = conn.execute(''' - SELECT status, put_timestamp, delete_timestamp, container_count - FROM account_stat''').fetchone() - # The account is considered deleted if its status is marked - # as 'DELETED" and the delete_timestamp is older than the supplied - # cutoff date; or if the delete_timestamp value is greater than - # the put_timestamp, and there are no containers for the account - status_del = (row['status'] == 'DELETED') - deltime = float(row['delete_timestamp']) - past_cutoff = (deltime < cutoff) - time_later = (row['delete_timestamp'] > row['put_timestamp']) - no_containers = (row['container_count'] in (None, '', 0, '0')) - return ( - (status_del and past_cutoff) or (time_later and no_containers)) - - def is_deleted(self): - """ - Check if the account DB is considered to be deleted. - - :returns: True if the account DB is considered to be deleted, False - otherwise - """ - if self.db_file != ':memory:' and not os.path.exists(self.db_file): - return True - try: - self._commit_puts() - except LockTimeout: - if not self.stale_reads_ok: - raise - with self.get() as conn: - row = conn.execute(''' - SELECT put_timestamp, delete_timestamp, container_count, status - FROM account_stat''').fetchone() - return row['status'] == 'DELETED' or ( - row['container_count'] in (None, '', 0, '0') and - row['delete_timestamp'] > row['put_timestamp']) - - def is_status_deleted(self): - """Only returns true if the status field is set to DELETED.""" - with self.get() as conn: - row = conn.execute(''' - SELECT status - FROM account_stat''').fetchone() - return (row['status'] == "DELETED") - - def get_info(self): - """ - Get global data for the account. 
- - :returns: dict with keys: account, created_at, put_timestamp, - delete_timestamp, container_count, object_count, - bytes_used, hash, id - """ - try: - self._commit_puts() - except LockTimeout: - if not self.stale_reads_ok: - raise - with self.get() as conn: - return dict(conn.execute(''' - SELECT account, created_at, put_timestamp, delete_timestamp, - container_count, object_count, bytes_used, hash, id - FROM account_stat - ''').fetchone()) - - def list_containers_iter(self, limit, marker, end_marker, prefix, - delimiter): - """ - Get a list of containerss sorted by name starting at marker onward, up - to limit entries. Entries will begin with the prefix and will not - have the delimiter after the prefix. - - :param limit: maximum number of entries to get - :param marker: marker query - :param end_marker: end marker query - :param prefix: prefix query - :param delimiter: delimiter for query - - :returns: list of tuples of (name, object_count, bytes_used, 0) - """ - (marker, end_marker, prefix, delimiter) = utf8encode( - marker, end_marker, prefix, delimiter) - try: - self._commit_puts() - except LockTimeout: - if not self.stale_reads_ok: - raise - if delimiter and not prefix: - prefix = '' - orig_marker = marker - with self.get() as conn: - results = [] - while len(results) < limit: - query = """ - SELECT name, object_count, bytes_used, 0 - FROM container - WHERE deleted = 0 AND """ - query_args = [] - if end_marker: - query += ' name < ? AND' - query_args.append(end_marker) - if marker and marker >= prefix: - query += ' name > ? AND' - query_args.append(marker) - elif prefix: - query += ' name >= ? AND' - query_args.append(prefix) - if self.get_db_version(conn) < 1: - query += ' +deleted = 0' - else: - query += ' deleted = 0' - query += ' ORDER BY name LIMIT ?' - query_args.append(limit - len(results)) - curs = conn.execute(query, query_args) - curs.row_factory = None - - if prefix is None: - return [r for r in curs] - if not delimiter: - return [r for r in curs if r[0].startswith(prefix)] - rowcount = 0 - for row in curs: - rowcount += 1 - marker = name = row[0] - if len(results) >= limit or not name.startswith(prefix): - curs.close() - return results - end = name.find(delimiter, len(prefix)) - if end > 0: - marker = name[:end] + chr(ord(delimiter) + 1) - dir_name = name[:end + 1] - if dir_name != orig_marker: - results.append([dir_name, 0, 0, 1]) - curs.close() - break - results.append(row) - if not rowcount: - break - return results - - def merge_items(self, item_list, source=None): - """ - Merge items into the container table. - - :param item_list: list of dictionaries of {'name', 'put_timestamp', - 'delete_timestamp', 'object_count', 'bytes_used', - 'deleted'} - :param source: if defined, update incoming_sync with the source - """ - with self.get() as conn: - max_rowid = -1 - for rec in item_list: - record = [rec['name'], rec['put_timestamp'], - rec['delete_timestamp'], rec['object_count'], - rec['bytes_used'], rec['deleted']] - query = ''' - SELECT name, put_timestamp, delete_timestamp, - object_count, bytes_used, deleted - FROM container WHERE name = ? 
- ''' - if self.get_db_version(conn) >= 1: - query += ' AND deleted IN (0, 1)' - curs = conn.execute(query, (rec['name'],)) - curs.row_factory = None - row = curs.fetchone() - if row: - row = list(row) - for i in xrange(5): - if record[i] is None and row[i] is not None: - record[i] = row[i] - if row[1] > record[1]: # Keep newest put_timestamp - record[1] = row[1] - if row[2] > record[2]: # Keep newest delete_timestamp - record[2] = row[2] - # If deleted, mark as such - if record[2] > record[1] and \ - record[3] in (None, '', 0, '0'): - record[5] = 1 - else: - record[5] = 0 - conn.execute(''' - DELETE FROM container WHERE name = ? AND - deleted IN (0, 1) - ''', (record[0],)) - conn.execute(''' - INSERT INTO container (name, put_timestamp, - delete_timestamp, object_count, bytes_used, - deleted) - VALUES (?, ?, ?, ?, ?, ?) - ''', record) - if source: - max_rowid = max(max_rowid, rec['ROWID']) - if source: - try: - conn.execute(''' - INSERT INTO incoming_sync (sync_point, remote_id) - VALUES (?, ?) - ''', (max_rowid, source)) - except sqlite3.IntegrityError: - conn.execute(''' - UPDATE incoming_sync SET sync_point=max(?, sync_point) - WHERE remote_id=? - ''', (max_rowid, source)) - conn.commit() + def _update_status_changed_at(self, conn, timestamp): + conn.execute( + 'UPDATE %s_stat SET status_changed_at = ?' + ' WHERE status_changed_at < ?' % self.db_type, + (timestamp, timestamp)) diff --git a/swift/common/db_auditor.py b/swift/common/db_auditor.py new file mode 100644 index 0000000000..5a4d7f7831 --- /dev/null +++ b/swift/common/db_auditor.py @@ -0,0 +1,168 @@ +# Copyright (c) 2010-2018 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
+ +import os +import time +from random import random + +from eventlet import Timeout + +import swift.common.db +from swift.common.utils import get_logger, audit_location_generator, \ + config_true_value, dump_recon_cache, EventletRateLimiter +from swift.common.daemon import Daemon +from swift.common.exceptions import DatabaseAuditorException +from swift.common.recon import DEFAULT_RECON_CACHE_PATH, \ + server_type_to_recon_file + + +class DatabaseAuditor(Daemon): + """Base Database Auditor.""" + + @property + def rcache(self): + return os.path.join( + self.recon_cache_path, + server_type_to_recon_file(self.server_type)) + + @property + def server_type(self): + raise NotImplementedError + + @property + def broker_class(self): + raise NotImplementedError + + def __init__(self, conf, logger=None): + self.conf = conf + self.logger = logger or get_logger(conf, log_route='{}-auditor'.format( + self.server_type)) + self.devices = conf.get('devices', '/srv/node') + self.mount_check = config_true_value(conf.get('mount_check', 'true')) + self.interval = float(conf.get('interval', 1800)) + self.logging_interval = 3600 # once an hour + self.passes = 0 + self.failures = 0 + self.max_dbs_per_second = \ + float(conf.get('{}s_per_second'.format(self.server_type), 200)) + self.rate_limiter = EventletRateLimiter(self.max_dbs_per_second) + swift.common.db.DB_PREALLOCATION = \ + config_true_value(conf.get('db_preallocation', 'f')) + self.recon_cache_path = conf.get('recon_cache_path', + DEFAULT_RECON_CACHE_PATH) + self.datadir = '{}s'.format(self.server_type) + + def _one_audit_pass(self, reported): + all_locs = audit_location_generator(self.devices, self.datadir, '.db', + mount_check=self.mount_check, + logger=self.logger) + for path, device, partition in all_locs: + self.audit(path) + if time.time() - reported >= self.logging_interval: + self.logger.info( + 'Since %(time)s: %(server_type)s audits: %(pass)s ' + 'passed audit, %(fail)s failed audit', + {'time': time.ctime(reported), + 'pass': self.passes, + 'fail': self.failures, + 'server_type': self.server_type}) + dump_recon_cache( + {'{}_audits_since'.format(self.server_type): reported, + '{}_audits_passed'.format(self.server_type): self.passes, + '{}_audits_failed'.format(self.server_type): + self.failures}, + self.rcache, self.logger) + reported = time.time() + self.passes = 0 + self.failures = 0 + self.rate_limiter.wait() + return reported + + def run_forever(self, *args, **kwargs): + """Run the database audit until stopped.""" + reported = time.time() + time.sleep(random() * self.interval) + while True: + self.logger.info( + 'Begin %s audit pass.', self.server_type) + begin = time.time() + try: + reported = self._one_audit_pass(reported) + except (Exception, Timeout): + self.logger.increment('errors') + self.logger.exception('ERROR auditing') + elapsed = time.time() - begin + self.logger.info( + '%(server_type)s audit pass completed: %(elapsed).02fs', + {'elapsed': elapsed, 'server_type': self.server_type.title()}) + dump_recon_cache({ + '{}_auditor_pass_completed'.format(self.server_type): elapsed}, + self.rcache, self.logger) + if elapsed < self.interval: + time.sleep(self.interval - elapsed) + + def run_once(self, *args, **kwargs): + """Run the database audit once.""" + self.logger.info( + 'Begin %s audit "once" mode', self.server_type) + begin = reported = time.time() + self._one_audit_pass(reported) + elapsed = time.time() - begin + self.logger.info( + '%(server_type)s audit "once" mode completed: %(elapsed).02fs', + {'elapsed': elapsed, 
'server_type': self.server_type.title()}) + dump_recon_cache( + {'{}_auditor_pass_completed'.format(self.server_type): elapsed}, + self.rcache, self.logger) + + def audit(self, path): + """ + Audits the given database path + + :param path: the path to a db + """ + start_time = time.time() + try: + broker = self.broker_class(path, logger=self.logger) + if not broker.is_deleted(): + info = broker.get_info() + err = self._audit(info, broker) + if err: + raise err + self.logger.increment('passes') + self.passes += 1 + self.logger.debug('Audit passed for %s', broker) + except DatabaseAuditorException as e: + self.logger.increment('failures') + self.failures += 1 + self.logger.error('Audit Failed for %(path)s: %(err)s', + {'path': path, 'err': str(e)}) + except (Exception, Timeout): + self.logger.increment('failures') + self.failures += 1 + self.logger.exception( + 'ERROR Could not get %(server_type)s info %(path)s', + {'server_type': self.server_type, 'path': path}) + self.logger.timing_since('timing', start_time) + + def _audit(self, info, broker): + """ + Run any additional audit checks in sub auditor classes + + :param info: The DB _info + :param broker: The broker + :return: None on success, otherwise an exception to throw. + """ + raise NotImplementedError diff --git a/swift/common/db_replicator.py b/swift/common/db_replicator.py index ed16177ed5..37403bd03f 100644 --- a/swift/common/db_replicator.py +++ b/swift/common/db_replicator.py @@ -1,4 +1,4 @@ -# Copyright (c) 2010-2012 OpenStack, LLC. +# Copyright (c) 2010-2012 OpenStack Foundation # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. @@ -13,7 +13,8 @@ # See the License for the specific language governing permissions and # limitations under the License. 
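The _audit hook at the end of the new swift/common/db_auditor.py above is the extension point for concrete auditors: a subclass supplies server_type and broker_class and returns either None or an exception from _audit. The sketch below is illustrative only and not part of the patch; the StatsCheckAuditor name and its negative-object_count check are hypothetical, though the override pattern matches how account/container auditors are expected to subclass this base.

from swift.common.db_auditor import DatabaseAuditor
from swift.common.exceptions import DatabaseAuditorException
from swift.container.backend import ContainerBroker


class StatsCheckAuditor(DatabaseAuditor):
    # Plain class attributes shadow the base class properties.
    server_type = 'container'       # drives logger name, recon file, datadir
    broker_class = ContainerBroker  # broker used to open each audited .db

    def _audit(self, info, broker):
        # info is broker.get_info(); return None on success, or an exception
        # for the base class audit() method to raise and count as a failure.
        if info.get('object_count') is not None and info['object_count'] < 0:
            return DatabaseAuditorException(
                'negative object_count for %s' % broker.db_file)
        return None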
-from __future__ import with_statement +import json +import logging import os import random import math @@ -22,22 +23,31 @@ import uuid import errno import re +from contextlib import contextmanager from eventlet import GreenPool, sleep, Timeout from eventlet.green import subprocess -import simplejson import swift.common.db +from swift.common.constraints import check_drive from swift.common.utils import get_logger, whataremyips, storage_directory, \ renamer, mkdirs, lock_parent_directory, config_true_value, \ - unlink_older_than, dump_recon_cache, rsync_ip + unlink_older_than, dump_recon_cache, rsync_module_interpolation, \ + parse_override_options, round_robin_iter, Everything, get_db_files, \ + parse_db_filename, quote, RateLimitedIterator, config_auto_int_value, \ + listdir, unlink_paths_older_than + from swift.common import ring -from swift.common.http import HTTP_NOT_FOUND, HTTP_INSUFFICIENT_STORAGE +from swift.common.ring.utils import is_local_device +from swift.common.http import HTTP_NOT_FOUND, HTTP_INSUFFICIENT_STORAGE, \ + is_success from swift.common.bufferedhttp import BufferedHTTPConnection -from swift.common.exceptions import DriveNotMounted, ConnectionTimeout +from swift.common.exceptions import DriveNotMounted from swift.common.daemon import Daemon from swift.common.swob import Response, HTTPNotFound, HTTPNoContent, \ - HTTPAccepted, HTTPInsufficientStorage, HTTPBadRequest + HTTPAccepted, HTTPBadRequest +from swift.common.recon import DEFAULT_RECON_CACHE_PATH, \ + server_type_to_recon_file DEBUG_TIMINGS_THRESHOLD = 10 @@ -57,12 +67,23 @@ def quarantine_db(object_file, server_type): os.path.join(object_dir, '..', '..', '..', '..', 'quarantined', server_type + 's', os.path.basename(object_dir))) try: - renamer(object_dir, quarantine_dir) - except OSError, e: + renamer(object_dir, quarantine_dir, fsync=False) + except OSError as e: if e.errno not in (errno.EEXIST, errno.ENOTEMPTY): raise quarantine_dir = "%s-%s" % (quarantine_dir, uuid.uuid4().hex) - renamer(object_dir, quarantine_dir) + renamer(object_dir, quarantine_dir, fsync=False) + + +def looks_like_partition(dir_name): + """ + True if the directory name is a valid partition number, False otherwise. + """ + try: + part = int(dir_name) + return part >= 0 + except ValueError: + return False def roundrobin_datadirs(datadirs): @@ -72,38 +93,59 @@ def roundrobin_datadirs(datadirs): found (in their proper places). The partitions within each data dir are walked randomly, however. - :param datadirs: a list of (path, node_id) to walk - :returns: A generator of (partition, path_to_db_file, node_id) + :param datadirs: a list of tuples of (path, context, partition_filter) to + walk. The context may be any object; the context is not + used by this function but is included with each yielded + tuple. 
+ :returns: A generator of (partition, path_to_db_file, context) """ - def walk_datadir(datadir, node_id): - partitions = os.listdir(datadir) + def walk_datadir(datadir, context, part_filter): + partitions = [pd for pd in os.listdir(datadir) + if looks_like_partition(pd) and part_filter(pd)] random.shuffle(partitions) for partition in partitions: part_dir = os.path.join(datadir, partition) if not os.path.isdir(part_dir): continue suffixes = os.listdir(part_dir) + if not suffixes: + os.rmdir(part_dir) + continue for suffix in suffixes: suff_dir = os.path.join(part_dir, suffix) if not os.path.isdir(suff_dir): continue hashes = os.listdir(suff_dir) + if not hashes: + os.rmdir(suff_dir) + continue for hsh in hashes: hash_dir = os.path.join(suff_dir, hsh) if not os.path.isdir(hash_dir): continue object_file = os.path.join(hash_dir, hsh + '.db') + # common case if os.path.exists(object_file): - yield (partition, object_file, node_id) + yield (partition, object_file, context) + continue + # look for any alternate db filenames + db_files = get_db_files(object_file) + if db_files: + yield (partition, db_files[-1], context) + continue + try: + os.rmdir(hash_dir) + except OSError as e: + if e.errno != errno.ENOTEMPTY: + raise - its = [walk_datadir(datadir, node_id) for datadir, node_id in datadirs] - while its: - for it in its: - try: - yield it.next() - except StopIteration: - its.remove(it) + its = [walk_datadir(datadir, context, filt) + for datadir, context, filt in datadirs] + + rr_its = round_robin_iter(its) + for datadir in rr_its: + yield datadir class ReplConnection(BufferedHTTPConnection): @@ -112,10 +154,10 @@ class ReplConnection(BufferedHTTPConnection): """ def __init__(self, node, partition, hash_, logger): - "" self.logger = logger self.node = node - BufferedHTTPConnection.__init__(self, '%(ip)s:%(port)s' % node) + host = "%s:%s" % (node['replication_ip'], node['replication_port']) + BufferedHTTPConnection.__init__(self, host) self.path = '/%s/%s/%s' % (node['device'], partition, hash_) def replicate(self, *args): @@ -124,90 +166,193 @@ def replicate(self, *args): :param args: list of json-encodable objects - :returns: httplib response object + :returns: bufferedhttp response object """ try: - body = simplejson.dumps(args) + body = json.dumps(args) self.request('REPLICATE', self.path, body, {'Content-Type': 'application/json'}) response = self.getresponse() response.data = response.read() return response except (Exception, Timeout): + self.close() self.logger.exception( - _('ERROR reading HTTP response from %s'), self.node) + 'ERROR reading HTTP response from %s', self.node) return None +class BrokerAnnotatedLogger: + """ + Formats log messages with broker details. + + This class augments messages with the broker's container path and DB + file path so that logs are easier to correlate during replication + and sharding workflows. + """ + def __init__(self, logger): + self.logger = logger + + def _get_broker_details(self, broker): + try: + db_file = broker.db_file + except Exception: # noqa + db_file = '' + try: + path = broker.path + except Exception: # noqa + path = '' + return path, db_file + + def _format_log_msg(self, broker, msg, *args): + # make best effort to include broker properties... 
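# (Illustrative, not part of the patch: for a container broker the formatted
# message ends up looking like
#   "Quarantining DB, path: AUTH_test/c1, db: /srv/node/sdb1/containers/.../<hash>.db"
# where the example account/container and device paths are hypothetical; if
# the broker cannot report a value, the corresponding field is left empty.)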
+ path, db_file = self._get_broker_details(broker) + if args: + if len(args) == 1 and isinstance(args[0], dict): + args = args[0] + msg = msg % args + return '%s, path: %s, db: %s' % (msg, quote(path), db_file) + + def _log(self, level, broker, msg, *args, **kwargs): + if not self.logger.isEnabledFor(level): + return + self.logger.log(level, self._format_log_msg(broker, msg, *args)) + + def debug(self, broker, msg, *args, **kwargs): + self._log(logging.DEBUG, broker, msg, *args, **kwargs) + + def info(self, broker, msg, *args, **kwargs): + self._log(logging.INFO, broker, msg, *args, **kwargs) + + def warning(self, broker, msg, *args, **kwargs): + self._log(logging.WARNING, broker, msg, *args, **kwargs) + + def error(self, broker, msg, *args, **kwargs): + self._log(logging.ERROR, broker, msg, *args, **kwargs) + + def exception(self, broker, msg, *args, **kwargs): + if not self.logger.isEnabledFor(logging.ERROR): + return + self.logger.exception(self._format_log_msg(broker, msg, *args)) + + class Replicator(Daemon): """ Implements the logic for directing db replication. """ - def __init__(self, conf): + def __init__(self, conf, logger=None): self.conf = conf - self.logger = get_logger(conf, log_route='replicator') + self.logger = logger or get_logger(conf, log_route='replicator') self.root = conf.get('devices', '/srv/node') self.mount_check = config_true_value(conf.get('mount_check', 'true')) + self.bind_ip = conf.get('bind_ip', '0.0.0.0') self.port = int(conf.get('bind_port', self.default_port)) concurrency = int(conf.get('concurrency', 8)) self.cpool = GreenPool(size=concurrency) swift_dir = conf.get('swift_dir', '/etc/swift') self.ring = ring.Ring(swift_dir, ring_name=self.server_type) + self._local_device_ids = {} self.per_diff = int(conf.get('per_diff', 1000)) self.max_diffs = int(conf.get('max_diffs') or 100) - self.interval = int(conf.get('interval') or - conf.get('run_pause') or 30) - self.vm_test_mode = config_true_value(conf.get('vm_test_mode', 'no')) - self.node_timeout = int(conf.get('node_timeout', 10)) + self.interval = float(conf.get('interval') or + conf.get('run_pause') or 30) + if 'run_pause' in conf: + if 'interval' in conf: + self.logger.warning( + 'Option %(type)s-replicator/run_pause is deprecated ' + 'and %(type)s-replicator/interval is already configured. ' + 'You can safely remove run_pause; it is now ignored and ' + 'will be removed in a future version.' + % {'type': self.server_type}) + else: + self.logger.warning( + 'Option %(type)s-replicator/run_pause is deprecated ' + 'and will be removed in a future version. ' + 'Update your configuration to use option ' + '%(type)s-replicator/interval.' 
+ % {'type': self.server_type}) + self.databases_per_second = float( + conf.get('databases_per_second', 50)) + self.node_timeout = float(conf.get('node_timeout', 10)) self.conn_timeout = float(conf.get('conn_timeout', 0.5)) + self.rsync_compress = config_true_value( + conf.get('rsync_compress', 'no')) + self.rsync_module = conf.get('rsync_module', '').rstrip('/') + if not self.rsync_module: + self.rsync_module = '{replication_ip}::%s' % self.server_type self.reclaim_age = float(conf.get('reclaim_age', 86400 * 7)) swift.common.db.DB_PREALLOCATION = \ config_true_value(conf.get('db_preallocation', 'f')) + swift.common.db.QUERY_LOGGING = \ + config_true_value(conf.get('db_query_logging', 'f')) self._zero_stats() self.recon_cache_path = conf.get('recon_cache_path', - '/var/cache/swift') - self.recon_replicator = '%s.recon' % self.server_type + DEFAULT_RECON_CACHE_PATH) + self.recon_replicator = server_type_to_recon_file(self.server_type) self.rcache = os.path.join(self.recon_cache_path, self.recon_replicator) self.extract_device_re = re.compile('%s%s([^%s]+)' % ( self.root, os.path.sep, os.path.sep)) + self.handoffs_only = config_true_value(conf.get('handoffs_only', 'no')) + self.handoff_delete = config_auto_int_value( + conf.get('handoff_delete', 'auto'), 0) + if self.handoff_delete >= self.ring.replica_count: + self.logger.warning( + 'handoff_delete=%d is too high to have an effect on a ring ' + 'with replica count %d. Disabling.', + self.handoff_delete, self.ring.replica_count) + self.handoff_delete = 0 + self.db_logger = BrokerAnnotatedLogger(logger=self.logger) def _zero_stats(self): """Zero out the stats.""" self.stats = {'attempted': 0, 'success': 0, 'failure': 0, 'ts_repl': 0, 'no_change': 0, 'hashmatch': 0, 'rsync': 0, 'diff': 0, 'remove': 0, 'empty': 0, 'remote_merge': 0, - 'start': time.time(), 'diff_capped': 0} + 'start': time.time(), 'diff_capped': 0, 'deferred': 0, + 'failure_nodes': {}} def _report_stats(self): """Report the current stats to the logs.""" + now = time.time() self.logger.info( - _('Attempted to replicate %(count)d dbs in %(time).5f seconds ' - '(%(rate).5f/s)'), + 'Attempted to replicate %(count)d dbs in %(time).5f seconds ' + '(%(rate).5f/s)', {'count': self.stats['attempted'], - 'time': time.time() - self.stats['start'], + 'time': now - self.stats['start'], 'rate': self.stats['attempted'] / - (time.time() - self.stats['start'] + 0.0000001)}) - self.logger.info(_('Removed %(remove)d dbs') % self.stats) - self.logger.info(_('%(success)s successes, %(failure)s failures') - % self.stats) + (now - self.stats['start'] + 0.0000001)}) + self.logger.info('Removed %(remove)d dbs', self.stats) + self.logger.info('%(success)s successes, %(failure)s failures', + self.stats) dump_recon_cache( {'replication_stats': self.stats, - 'replication_time': time.time() - self.stats['start']}, + 'replication_time': now - self.stats['start'], + 'replication_last': now}, self.rcache, self.logger) self.logger.info(' '.join(['%s:%s' % item for item in - self.stats.items() if item[0] in + sorted(self.stats.items()) if item[0] in ('no_change', 'hashmatch', 'rsync', 'diff', 'ts_repl', - 'empty', 'diff_capped')])) + 'empty', 'diff_capped', 'remote_merge')])) + + def _add_failure_stats(self, failure_devs_info): + for node, dev in failure_devs_info: + self.stats['failure'] += 1 + failure_devs = self.stats['failure_nodes'].setdefault(node, {}) + failure_devs.setdefault(dev, 0) + failure_devs[dev] += 1 - def _rsync_file(self, db_file, remote_file, whole_file=True): + def _rsync_file(self, broker, 
remote_file, whole_file=True, + different_region=False): """ Sync a single file using rsync. Used by _rsync_db to handle syncing. - :param db_file: file to be synced + :param broker: DB broker object of DB to be synced :param remote_file: remote location to sync the DB file to :param whole-file: if True, uses rsync's --whole-file flag + :param different_region: if True, the destination node is in a + different region :returns: True if the sync was successful, False otherwise """ @@ -216,16 +361,25 @@ def _rsync_file(self, db_file, remote_file, whole_file=True): '--contimeout=%s' % int(math.ceil(self.conn_timeout))] if whole_file: popen_args.append('--whole-file') - popen_args.extend([db_file, remote_file]) + + if self.rsync_compress and different_region: + # Allow for compression, but only if the remote node is in + # a different region than the local one. + popen_args.append('--compress') + + popen_args.extend([broker.db_file, remote_file]) proc = subprocess.Popen(popen_args) proc.communicate() if proc.returncode != 0: - self.logger.error(_('ERROR rsync failed with %(code)s: %(args)s'), - {'code': proc.returncode, 'args': popen_args}) + self.db_logger.error( + broker, + 'ERROR rsync failed with %s: %r', + proc.returncode, popen_args) return proc.returncode == 0 def _rsync_db(self, broker, device, http, local_id, - replicate_method='complete_rsync', replicate_timeout=None): + replicate_method='complete_rsync', replicate_timeout=None, + different_region=False): """ Sync a whole db using rsync. @@ -235,28 +389,38 @@ def _rsync_db(self, broker, device, http, local_id, :param local_id: unique ID of the local database replica :param replicate_method: remote operation to perform after rsync :param replicate_timeout: timeout to wait in seconds + :param different_region: if True, the destination node is in a + different region """ - device_ip = rsync_ip(device['ip']) - if self.vm_test_mode: - remote_file = '%s::%s%s/%s/tmp/%s' % ( - device_ip, self.server_type, device['port'], device['device'], - local_id) - else: - remote_file = '%s::%s/%s/tmp/%s' % ( - device_ip, self.server_type, device['device'], local_id) + rsync_module = rsync_module_interpolation(self.rsync_module, device) + rsync_path = '%s/tmp/%s' % (device['device'], local_id) + remote_file = '%s/%s' % (rsync_module, rsync_path) mtime = os.path.getmtime(broker.db_file) - if not self._rsync_file(broker.db_file, remote_file): + if not self._rsync_file(broker, remote_file, + different_region=different_region): return False # perform block-level sync if the db was modified during the first sync if os.path.exists(broker.db_file + '-journal') or \ os.path.getmtime(broker.db_file) > mtime: # grab a lock so nobody else can modify it with broker.lock(): - if not self._rsync_file(broker.db_file, remote_file, False): + if not self._rsync_file(broker, remote_file, whole_file=False, + different_region=different_region): return False with Timeout(replicate_timeout or self.node_timeout): - response = http.replicate(replicate_method, local_id) - return response and response.status >= 200 and response.status < 300 + response = http.replicate(replicate_method, local_id, + os.path.basename(broker.db_file)) + return response and 200 <= response.status < 300 + + def _send_replicate_request(self, http, *repl_args): + with Timeout(self.node_timeout): + response = http.replicate(*repl_args) + if not response or not is_success(response.status): + if response: + self.logger.error('ERROR Bad response %s from %s', + response.status, http.host) + return False + 
return True def _usync_db(self, point, broker, http, remote_id, local_id): """ @@ -272,34 +436,43 @@ def _usync_db(self, point, broker, http, remote_id, local_id): """ self.stats['diff'] += 1 self.logger.increment('diffs') - self.logger.debug(_('Syncing chunks with %s'), http.host) + self.db_logger.debug( + broker, + 'usyncing chunks to %s, starting at row %s', + '%(ip)s:%(port)s/%(device)s' % http.node, point) + start = time.time() sync_table = broker.get_syncs() objects = broker.get_items_since(point, self.per_diff) diffs = 0 while len(objects) and diffs < self.max_diffs: diffs += 1 - with Timeout(self.node_timeout): - response = http.replicate('merge_items', objects, local_id) - if not response or response.status >= 300 or response.status < 200: - if response: - self.logger.error(_('ERROR Bad response %(status)s from ' - '%(host)s'), - {'status': response.status, - 'host': http.host}) + if not self._send_replicate_request( + http, 'merge_items', objects, local_id): return False + # replication relies on db order to send the next merge batch in + # order with no gaps point = objects[-1]['ROWID'] objects = broker.get_items_since(point, self.per_diff) + + self.db_logger.debug( + broker, + 'usyncing chunks to %s, finished at row %s (%gs)', + '%(ip)s:%(port)s/%(device)s' % http.node, + point, + time.time() - start + ) + if objects: - self.logger.debug(_( - 'Synchronization for %s has fallen more than ' - '%s rows behind; moving on and will try again next pass.') % - (broker.db_file, self.max_diffs * self.per_diff)) + self.db_logger.debug( + broker, 'Synchronization has fallen more than ' + '%s rows behind; moving on and will try again next pass', + self.max_diffs * self.per_diff) self.stats['diff_capped'] += 1 self.logger.increment('diff_caps') else: with Timeout(self.node_timeout): response = http.replicate('merge_syncs', sync_table) - if response and response.status >= 200 and response.status < 300: + if response and 200 <= response.status < 300: broker.merge_syncs([{'remote_id': remote_id, 'sync_point': point}], incoming=False) @@ -335,16 +508,24 @@ def _http_connect(self, node, partition, db_file): Make an http_connection using ReplConnection :param node: node dictionary from the ring - :param partition: partition partition to send in the url + :param partition: partition to send in the url :param db_file: DB file :returns: ReplConnection object """ - return ReplConnection(node, partition, - os.path.basename(db_file).split('.', 1)[0], - self.logger) + hsh, other, ext = parse_db_filename(db_file) + return ReplConnection(node, partition, hsh, self.logger) - def _repl_to_node(self, node, broker, partition, info): + def _gather_sync_args(self, info): + """ + Convert local replication_info to sync args tuple. + """ + sync_args_order = ('max_row', 'hash', 'id', 'created_at', + 'put_timestamp', 'delete_timestamp', 'metadata') + return tuple(info[key] for key in sync_args_order) + + def _repl_to_node(self, node, broker, partition, info, + different_region=False): """ Replicate a database to a node. 
@@ -354,44 +535,127 @@ def _repl_to_node(self, node, broker, partition, info): :param info: DB info as a dictionary of {'max_row', 'hash', 'id', 'created_at', 'put_timestamp', 'delete_timestamp', 'metadata'} + :param different_region: if True, the destination node is in a + different region :returns: True if successful, False otherwise """ - with ConnectionTimeout(self.conn_timeout): - http = self._http_connect(node, partition, broker.db_file) - if not http: - self.logger.error( - _('ERROR Unable to connect to remote server: %s'), node) - return False + http = self._http_connect(node, partition, broker.db_file) + sync_args = self._gather_sync_args(info) with Timeout(self.node_timeout): - response = http.replicate( - 'sync', info['max_row'], info['hash'], info['id'], - info['created_at'], info['put_timestamp'], - info['delete_timestamp'], info['metadata']) + response = http.replicate('sync', *sync_args) if not response: return False - elif response.status == HTTP_NOT_FOUND: # completely missing, rsync + return self._handle_sync_response(node, response, info, broker, http, + different_region=different_region) + + def _handle_sync_response(self, node, response, info, broker, http, + different_region=False): + if response.status == HTTP_NOT_FOUND: # completely missing, rsync self.stats['rsync'] += 1 self.logger.increment('rsyncs') - return self._rsync_db(broker, node, http, info['id']) + return self._rsync_db(broker, node, http, info['id'], + different_region=different_region) elif response.status == HTTP_INSUFFICIENT_STORAGE: raise DriveNotMounted() - elif response.status >= 200 and response.status < 300: - rinfo = simplejson.loads(response.data) + elif 200 <= response.status < 300: + rinfo = json.loads(response.data) local_sync = broker.get_sync(rinfo['id'], incoming=False) - if self._in_sync(rinfo, info, broker, local_sync): - return True - # if the difference in rowids between the two differs by - # more than 50%, rsync then do a remote merge. - if rinfo['max_row'] / float(info['max_row']) < 0.5: - self.stats['remote_merge'] += 1 - self.logger.increment('remote_merges') - return self._rsync_db(broker, node, http, info['id'], - replicate_method='rsync_then_merge', - replicate_timeout=(info['count'] / 2000)) - # else send diffs over to the remote server - return self._usync_db(max(rinfo['point'], local_sync), - broker, http, rinfo['id'], info['id']) + if rinfo.get('metadata', ''): + broker.update_metadata(json.loads(rinfo['metadata'])) + return self._choose_replication_mode( + node, rinfo, info, local_sync, broker, http, + different_region) + return False + + def _choose_replication_mode(self, node, rinfo, info, local_sync, broker, + http, different_region): + if self._in_sync(rinfo, info, broker, local_sync): + self.db_logger.debug( + broker, + 'in sync with %(ip)s:%(port)s/%(device)s, ' + 'nothing to do', node) + return True + + # if the difference in rowids between the two differs by + # more than 50% and the difference is greater than per_diff, + # rsync then do a remote merge. + # NOTE: difference > per_diff stops us from dropping to rsync + # on smaller containers, who have only a few rows to sync. 
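+        # Illustrative numbers (not from the patch), assuming per_diff=1000:
+        # a local max_row of 100000 against a remote max_row of 40000 gives a
+        # ratio of 0.4 (< 0.5) with a 60000-row gap (> per_diff), so the whole
+        # db is rsynced and merged; a local max_row of 1500 against a remote
+        # 600 also gives ratio 0.4, but the 900-row gap is under per_diff, so
+        # the small db still goes through _usync_db.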
+ if (rinfo['max_row'] / float(info['max_row']) < 0.5 and + info['max_row'] - rinfo['max_row'] > self.per_diff): + self.stats['remote_merge'] += 1 + self.logger.increment('remote_merges') + return self._rsync_db(broker, node, http, info['id'], + replicate_method='rsync_then_merge', + replicate_timeout=(info['count'] / 2000), + different_region=different_region) + # else send diffs over to the remote server + return self._usync_db(max(rinfo['point'], local_sync), + broker, http, rinfo['id'], info['id']) + + def _post_replicate_hook(self, broker, info, responses): + """ + :param broker: broker instance for the database that just replicated + :param info: pre-replication full info dict + :param responses: a list of bools indicating success from nodes + """ + pass + + def cleanup_post_replicate(self, broker, orig_info, responses): + """ + Cleanup non primary database from disk if needed. + + :param broker: the broker for the database we're replicating + :param orig_info: snapshot of the broker replication info dict taken + before replication + :param responses: a list of boolean success values for each replication + request to other nodes + + :return success: returns False if deletion of the database was + attempted but unsuccessful, otherwise returns True. + """ + log_template = 'Not deleting db (%s)' + max_row_delta = broker.get_max_row() - orig_info['max_row'] + if max_row_delta < 0: + reason = 'negative max_row_delta: %s' % max_row_delta + self.db_logger.error(broker, log_template, reason) + return True + if max_row_delta: + reason = '%s new rows' % max_row_delta + self.db_logger.debug(broker, log_template, reason) + return True + if self.handoff_delete: + # delete handoff if we have had handoff_delete successes + successes_count = len([resp for resp in responses if resp]) + delete_handoff = successes_count >= self.handoff_delete + else: + delete_handoff = responses and all(responses) + if not delete_handoff: + reason = '%s/%s success' % (responses.count(True), len(responses)) + self.db_logger.debug(broker, log_template, reason) + return True + # If the db has been successfully synced to all of its peers, it can be + # removed. Callers should have already checked that the db is not on a + # primary node. + if not self.delete_db(broker): + self.db_logger.debug(broker, 'Failed to delete db') + return False + self.db_logger.debug(broker, 'Successfully deleted db') + return True + + def _reclaim_tmp_dbs(self, broker, now): + fnames = listdir(broker.db_dir) + fnames = [os.path.join(broker.db_dir, fname) for fname in fnames + if fname.endswith('.tmp')] + unlink_paths_older_than(fnames, now - self.reclaim_age) + + def _reclaim(self, broker, now=None): + if not now: + now = time.time() + self._reclaim_tmp_dbs(broker, now) + return broker.reclaim(now - self.reclaim_age, + now - (self.reclaim_age * 2)) def _replicate_object(self, partition, object_file, node_id): """ @@ -400,90 +664,163 @@ def _replicate_object(self, partition, object_file, node_id): :param partition: partition to be replicated to :param object_file: DB file name to be replicated - :param node_id: node id of the node to be replicated to + :param node_id: node id of the node to be replicated from + :returns: a tuple (success, responses). ``success`` is a boolean that + is True if the method completed successfully, False otherwise. + ``responses`` is a list of booleans each of which indicates the + success or not of replicating to a peer node if replication has + been attempted. 
``success`` is False if any of ``responses`` is + False; when ``responses`` is empty, ``success`` may be either True + or False. """ - start_time = time.time() - self.logger.debug(_('Replicating db %s'), object_file) + start_time = now = time.time() + self.logger.debug('Replicating db %s', object_file) self.stats['attempted'] += 1 self.logger.increment('attempts') + shouldbehere = True + responses = [] + broker = None try: - broker = self.brokerclass(object_file, pending_timeout=30) - broker.reclaim(time.time() - self.reclaim_age, - time.time() - (self.reclaim_age * 2)) + broker = self.brokerclass(object_file, pending_timeout=30, + logger=self.logger) + self._reclaim(broker, now) info = broker.get_replication_info() - full_info = broker.get_info() - except (Exception, Timeout), e: + bpart = self.ring.get_part( + info['account'], info.get('container')) + if bpart != int(partition): + partition = bpart + # Important to set this false here since the later check only + # checks if it's on the proper device, not partition. + shouldbehere = False + self.db_logger.error( + broker, + 'Found db that should be on partition %s; will ' + 'replicate out and remove' % bpart) + except (Exception, Timeout) as e: if 'no such table' in str(e): - self.logger.error(_('Quarantining DB %s'), object_file) + if broker is None: + self.logger.error('Quarantining DB %s', object_file) + else: + self.db_logger.error(broker, 'Quarantining DB') quarantine_db(broker.db_file, broker.db_type) else: - self.logger.exception(_('ERROR reading db %s'), object_file) - self.stats['failure'] += 1 + if broker is None: + self.logger.exception('ERROR reading db from %s', + object_file) + else: + self.db_logger.exception(broker, 'ERROR reading db') + nodes = self.ring.get_part_nodes(int(partition)) + self._add_failure_stats([(failure_dev['replication_ip'], + failure_dev['device']) + for failure_dev in nodes]) self.logger.increment('failures') - return - # The db is considered deleted if the delete_timestamp value is greater - # than the put_timestamp, and there are no objects. - delete_timestamp = 0 - try: - delete_timestamp = float(info['delete_timestamp']) - except ValueError: - pass - put_timestamp = 0 - try: - put_timestamp = float(info['put_timestamp']) - except ValueError: - pass - if delete_timestamp < (time.time() - self.reclaim_age) and \ - delete_timestamp > put_timestamp and \ - info['count'] in (None, '', 0, '0'): - if self.report_up_to_date(full_info): - self.delete_db(object_file) + return False, responses + if broker.is_reclaimable(now, self.reclaim_age): + if self.report_up_to_date(info): + self.delete_db(broker) self.logger.timing_since('timing', start_time) - return - responses = [] + return True, responses + failure_devs_info = set() nodes = self.ring.get_part_nodes(int(partition)) - shouldbehere = bool([n for n in nodes if n['id'] == node_id]) + local_dev = None + for node in nodes: + if node['id'] == node_id: + local_dev = node + break + if shouldbehere: + shouldbehere = bool([n for n in nodes if n['id'] == node_id]) # See Footnote [1] for an explanation of the repl_nodes assignment. 
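        # Illustrative example (not from the patch): with primary nodes
        # [n0, n1, n2] and node_id matching n1, the loop below stops at i == 1,
        # so repl_nodes is [n2, n0]: the primaries after the local node,
        # followed by the ones before it.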
- i = 0 - while i < len(nodes) and nodes[i]['id'] != node_id: - i += 1 - repl_nodes = nodes[i + 1:] + nodes[:i] + if len(nodes) > 1: + i = 0 + while i < len(nodes) and nodes[i]['id'] != node_id: + i += 1 + repl_nodes = nodes[i + 1:] + nodes[:i] + else: # Special case if using only a single replica + repl_nodes = nodes more_nodes = self.ring.get_more_nodes(int(partition)) + if not local_dev: + # Check further if local device is a handoff node + for node in self.ring.get_more_nodes(int(partition)): + if node['id'] == node_id: + local_dev = node + break for node in repl_nodes: + different_region = False + if local_dev and local_dev['region'] != node['region']: + # This additional information will help later if we + # want to handle syncing to a node in different + # region with some optimizations. + different_region = True success = False try: - success = self._repl_to_node(node, broker, partition, info) + success = self._repl_to_node(node, broker, partition, info, + different_region) except DriveNotMounted: - repl_nodes.append(more_nodes.next()) - self.logger.error(_('ERROR Remote drive not mounted %s'), node) + try: + repl_nodes.append(next(more_nodes)) + except StopIteration: + self.db_logger.error( + broker, + 'ERROR There are not enough handoff nodes to reach ' + 'replica count for partition %s', + partition) + self.db_logger.error( + broker, + 'ERROR Remote drive not mounted %s', node) except (Exception, Timeout): - self.logger.exception(_('ERROR syncing %(file)s with node' - ' %(node)s'), - {'file': object_file, 'node': node}) - self.stats['success' if success else 'failure'] += 1 + self.db_logger.exception( + broker, "ERROR syncing with %s", node) + + if not success: + failure_devs_info.add((node['replication_ip'], node['device'])) self.logger.increment('successes' if success else 'failures') responses.append(success) - if not shouldbehere and all(responses): - # If the db shouldn't be on this node and has been successfully - # synced to all of its peers, it can be removed. - self.delete_db(object_file) + try: + self._post_replicate_hook(broker, info, responses) + except (Exception, Timeout): + self.db_logger.exception( + broker, 'UNHANDLED EXCEPTION: in post replicate hook') + if not shouldbehere: + if not self.cleanup_post_replicate(broker, info, responses): + failure_devs_info.update( + [(failure_dev['replication_ip'], failure_dev['device']) + for failure_dev in repl_nodes]) + target_devs_info = set([(target_dev['replication_ip'], + target_dev['device']) + for target_dev in repl_nodes]) + self.stats['success'] += len(target_devs_info - failure_devs_info) + self._add_failure_stats(failure_devs_info) + self.logger.timing_since('timing', start_time) + if shouldbehere: + responses.append(True) + return all(responses), responses - def delete_db(self, object_file): + def delete_db(self, broker): + object_file = broker.db_file hash_dir = os.path.dirname(object_file) suf_dir = os.path.dirname(hash_dir) with lock_parent_directory(object_file): shutil.rmtree(hash_dir, True) - try: - os.rmdir(suf_dir) - except OSError, err: - if err.errno not in (errno.ENOENT, errno.ENOTEMPTY): - self.logger.exception( - _('ERROR while trying to clean up %s') % suf_dir) self.stats['remove'] += 1 device_name = self.extract_device(object_file) self.logger.increment('removes.' 
+ device_name) + for parent_dir in (suf_dir, os.path.dirname(suf_dir)): + try: + os.rmdir(parent_dir) + except OSError as err: + if err.errno == errno.ENOTEMPTY: + break + elif err.errno == errno.ENOENT: + continue + else: + self.db_logger.exception( + broker, + 'ERROR while trying to clean up %s', parent_dir) + return False + return True + def extract_device(self, object_file): """ Extract the device name from an object path. Returns "UNKNOWN" if the @@ -496,36 +833,98 @@ def extract_device(self, object_file): return match.groups()[0] return "UNKNOWN" + def _partition_dir_filter(self, device_id, partitions_to_replicate): + + def filt(partition_dir): + partition = int(partition_dir) + if self.handoffs_only: + primary_node_ids = [ + d['id'] for d in self.ring.get_part_nodes(partition)] + if device_id in primary_node_ids: + return False + + if partition not in partitions_to_replicate: + return False + + return True + + return filt + def report_up_to_date(self, full_info): return True + def roundrobin_datadirs(self, dirs): + return RateLimitedIterator( + roundrobin_datadirs(dirs), + elements_per_second=self.databases_per_second) + def run_once(self, *args, **kwargs): """Run a replication pass once.""" + override_options = parse_override_options(once=True, **kwargs) + + devices_to_replicate = override_options.devices or Everything() + partitions_to_replicate = override_options.partitions or Everything() + self._zero_stats() dirs = [] - ips = whataremyips() + ips = whataremyips(self.bind_ip) if not ips: - self.logger.error(_('ERROR Failed to get my own IPs?')) + self.logger.error('ERROR Failed to get my own IPs?') return + + if self.handoffs_only or self.handoff_delete: + self.logger.warning( + 'Starting replication pass with handoffs_only ' + 'and/or handoffs_delete enabled. 
' + 'These modes are not intended for normal ' + 'operation; use these options with care.') + + self._local_device_ids = {} + found_local = False for node in self.ring.devs: - if node and node['ip'] in ips and node['port'] == self.port: - if self.mount_check and not os.path.ismount( - os.path.join(self.root, node['device'])): - self.logger.warn( - _('Skipping %(device)s as it is not mounted') % node) + if node and is_local_device(ips, self.port, + node['replication_ip'], + node['replication_port']): + found_local = True + try: + dev_path = check_drive(self.root, node['device'], + self.mount_check) + except ValueError as err: + self._add_failure_stats( + [(failure_dev['replication_ip'], + failure_dev['device']) + for failure_dev in self.ring.devs if failure_dev]) + self.logger.warning('Skipping: %s', err) + continue + if node['device'] not in devices_to_replicate: + self.logger.debug( + 'Skipping device %s due to given arguments', + node['device']) continue unlink_older_than( - os.path.join(self.root, node['device'], 'tmp'), + os.path.join(dev_path, 'tmp'), time.time() - self.reclaim_age) datadir = os.path.join(self.root, node['device'], self.datadir) if os.path.isdir(datadir): - dirs.append((datadir, node['id'])) - self.logger.info(_('Beginning replication run')) - for part, object_file, node_id in roundrobin_datadirs(dirs): + self._local_device_ids[node['id']] = node + part_filt = self._partition_dir_filter( + node['id'], partitions_to_replicate) + dirs.append((datadir, node['id'], part_filt)) + if not found_local: + self.logger.error("Can't find itself %s with port %s in ring " + "file, not replicating", + ", ".join(ips), self.port) + self.logger.info('Beginning replication run') + for part, object_file, node_id in self.roundrobin_datadirs(dirs): self.cpool.spawn_n( self._replicate_object, part, object_file, node_id) self.cpool.waitall() - self.logger.info(_('Replication run OVER')) + self.logger.info('Replication run OVER') + if self.handoffs_only or self.handoff_delete: + self.logger.warning( + 'Finished replication pass with handoffs_only and/or ' + 'handoffs_delete enabled. 
If these are no longer required, ' + 'disable them.') self._report_stats() def run_forever(self, *args, **kwargs): @@ -538,7 +937,7 @@ def run_forever(self, *args, **kwargs): try: self.run_once() except (Exception, Timeout): - self.logger.exception(_('ERROR trying to replicate')) + self.logger.exception('ERROR trying to replicate') elapsed = time.time() - begin if elapsed < self.interval: sleep(self.interval - elapsed) @@ -554,16 +953,21 @@ def __init__(self, root, datadir, broker_class, mount_check=True, self.broker_class = broker_class self.mount_check = mount_check self.logger = logger or get_logger({}, log_route='replicator-rpc') + self.db_logger = BrokerAnnotatedLogger(logger=self.logger) + + def _db_file_exists(self, db_path): + return os.path.exists(db_path) def dispatch(self, replicate_args, args): if not hasattr(args, 'pop'): return HTTPBadRequest(body='Invalid object type') op = args.pop(0) drive, partition, hsh = replicate_args - if self.mount_check and \ - not os.path.ismount(os.path.join(self.root, drive)): + try: + dev_path = check_drive(self.root, drive, self.mount_check) + except ValueError: return Response(status='507 %s is not mounted' % drive) - db_file = os.path.join(self.root, drive, + db_file = os.path.join(dev_path, storage_directory(self.datadir, partition, hsh), hsh + '.db') if op == 'rsync_then_merge': @@ -574,59 +978,102 @@ def dispatch(self, replicate_args, args): # someone might be about to rsync a db to us, # make sure there's a tmp dir to receive it. mkdirs(os.path.join(self.root, drive, 'tmp')) - if not os.path.exists(db_file): + if not self._db_file_exists(db_file): return HTTPNotFound() - return getattr(self, op)(self.broker_class(db_file), args) + return getattr(self, op)( + self.broker_class(db_file, logger=self.logger), args) - def sync(self, broker, args): - (remote_sync, hash_, id_, created_at, put_timestamp, - delete_timestamp, metadata) = args + @contextmanager + def debug_timing(self, name): timemark = time.time() - try: - info = broker.get_replication_info() - except (Exception, Timeout), e: - if 'no such table' in str(e): - self.logger.error(_("Quarantining DB %s") % broker.db_file) - quarantine_db(broker.db_file, broker.db_type) - return HTTPNotFound() - raise + yield timespan = time.time() - timemark if timespan > DEBUG_TIMINGS_THRESHOLD: - self.logger.debug(_('replicator-rpc-sync time for info: %.02fs') % - timespan) + self.logger.debug( + 'replicator-rpc-sync time for %s: %.02fs' % ( + name, timespan)) + + def _parse_sync_args(self, args): + """ + Convert remote sync args to remote_info dictionary. 
+ """ + (remote_sync, hash_, id_, created_at, put_timestamp, + delete_timestamp, metadata) = args[:7] + remote_metadata = {} if metadata: - timemark = time.time() - broker.update_metadata(simplejson.loads(metadata)) - timespan = time.time() - timemark - if timespan > DEBUG_TIMINGS_THRESHOLD: - self.logger.debug(_('replicator-rpc-sync time for ' - 'update_metadata: %.02fs') % timespan) - if info['put_timestamp'] != put_timestamp or \ - info['created_at'] != created_at or \ - info['delete_timestamp'] != delete_timestamp: - timemark = time.time() - broker.merge_timestamps( - created_at, put_timestamp, delete_timestamp) - timespan = time.time() - timemark - if timespan > DEBUG_TIMINGS_THRESHOLD: - self.logger.debug(_('replicator-rpc-sync time for ' - 'merge_timestamps: %.02fs') % timespan) - timemark = time.time() - info['point'] = broker.get_sync(id_) - timespan = time.time() - timemark - if timespan > DEBUG_TIMINGS_THRESHOLD: - self.logger.debug(_('replicator-rpc-sync time for get_sync: ' - '%.02fs') % timespan) - if hash_ == info['hash'] and info['point'] < remote_sync: - timemark = time.time() - broker.merge_syncs([{'remote_id': id_, - 'sync_point': remote_sync}]) - info['point'] = remote_sync - timespan = time.time() - timemark - if timespan > DEBUG_TIMINGS_THRESHOLD: - self.logger.debug(_('replicator-rpc-sync time for ' - 'merge_syncs: %.02fs') % timespan) - return Response(simplejson.dumps(info)) + try: + remote_metadata = json.loads(metadata) + except ValueError: + self.logger.error("Unable to decode remote metadata %r", + metadata) + remote_info = { + 'point': remote_sync, + 'hash': hash_, + 'id': id_, + 'created_at': created_at, + 'put_timestamp': put_timestamp, + 'delete_timestamp': delete_timestamp, + 'metadata': remote_metadata, + } + return remote_info + + def sync(self, broker, args): + remote_info = self._parse_sync_args(args) + return self._handle_sync_request(broker, remote_info) + + def _get_synced_replication_info(self, broker, remote_info): + """ + Apply any changes to the broker based on remote_info and return the + current replication info. + + :param broker: the database broker + :param remote_info: the remote replication info + + :returns: local broker replication info + """ + return broker.get_replication_info() + + def _handle_sync_request(self, broker, remote_info): + """ + Update metadata, timestamps, sync points. + """ + with self.debug_timing('info'): + try: + info = self._get_synced_replication_info(broker, remote_info) + except (Exception, Timeout) as e: + if 'no such table' in str(e): + self.db_logger.error(broker, "Quarantining DB", ) + quarantine_db(broker.db_file, broker.db_type) + return HTTPNotFound() + raise + # TODO(mattoliverau) At this point in the RPC, we have the callers + # replication info and ours, so it would be cool to be able to make + # an educated guess here on the size of the incoming replication (maybe + # average object table row size * difference in ROWIDs or something) + # and the fallocate_reserve setting so we could return a 507. + # This would make db fallocate_reserve more or less on par with the + # object's. 
+ if remote_info['metadata']: + with self.debug_timing('update_metadata'): + broker.update_metadata(remote_info['metadata']) + sync_timestamps = ('created_at', 'put_timestamp', 'delete_timestamp') + if any(info[ts] != remote_info[ts] for ts in sync_timestamps): + with self.debug_timing('merge_timestamps'): + broker.merge_timestamps(*(remote_info[ts] for ts in + sync_timestamps)) + with self.debug_timing('get_sync'): + info['point'] = broker.get_sync(remote_info['id']) + if remote_info['hash'] == info['hash'] and \ + info['point'] < remote_info['point']: + with self.debug_timing('merge_syncs'): + translate = { + 'remote_id': 'id', + 'sync_point': 'point', + } + data = dict((k, remote_info[v]) for k, v in translate.items()) + broker.merge_syncs([data]) + info['point'] = remote_info['point'] + return Response(json.dumps(info)) def merge_syncs(self, broker, args): broker.merge_syncs(args[0]) @@ -638,21 +1085,32 @@ def merge_items(self, broker, args): def complete_rsync(self, drive, db_file, args): old_filename = os.path.join(self.root, drive, 'tmp', args[0]) + if args[1:]: + db_file = os.path.join(os.path.dirname(db_file), args[1]) if os.path.exists(db_file): return HTTPNotFound() if not os.path.exists(old_filename): return HTTPNotFound() - broker = self.broker_class(old_filename) + broker = self.broker_class(old_filename, logger=self.logger) broker.newid(args[0]) renamer(old_filename, db_file) return HTTPNoContent() + def _abort_rsync_then_merge(self, db_file, tmp_filename): + return not (self._db_file_exists(db_file) and + os.path.exists(tmp_filename)) + + def _post_rsync_then_merge_hook(self, existing_broker, new_broker): + # subclasses may override to make custom changes to the new broker + pass + def rsync_then_merge(self, drive, db_file, args): - old_filename = os.path.join(self.root, drive, 'tmp', args[0]) - if not os.path.exists(db_file) or not os.path.exists(old_filename): + tmp_filename = os.path.join(self.root, drive, 'tmp', args[0]) + if self._abort_rsync_then_merge(db_file, tmp_filename): return HTTPNotFound() - new_broker = self.broker_class(old_filename) - existing_broker = self.broker_class(db_file) + new_broker = self.broker_class(tmp_filename, logger=self.logger) + existing_broker = self.broker_class(db_file, logger=self.logger) + db_file = existing_broker.db_file point = -1 objects = existing_broker.get_items_since(point, 1000) while len(objects): @@ -660,8 +1118,13 @@ def rsync_then_merge(self, drive, db_file, args): point = objects[-1]['ROWID'] objects = existing_broker.get_items_since(point, 1000) sleep() + new_broker.merge_syncs(existing_broker.get_syncs()) + self._post_rsync_then_merge_hook(existing_broker, new_broker) new_broker.newid(args[0]) - renamer(old_filename, db_file) + new_broker.update_metadata(existing_broker.metadata) + if self._abort_rsync_then_merge(db_file, tmp_filename): + return HTTPNotFound() + renamer(tmp_filename, db_file) return HTTPNoContent() # Footnote [1]: diff --git a/swift/common/digest.py b/swift/common/digest.py new file mode 100644 index 0000000000..36bc47a9bd --- /dev/null +++ b/swift/common/digest.py @@ -0,0 +1,141 @@ +# Copyright (c) 2022 NVIDIA +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. 
+# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. +import binascii +import hmac + +from swift.common.utils import strict_b64decode + + +DEFAULT_ALLOWED_DIGESTS = 'sha1 sha256 sha512' +DEPRECATED_DIGESTS = {'sha1'} +SUPPORTED_DIGESTS = set(DEFAULT_ALLOWED_DIGESTS.split()) | DEPRECATED_DIGESTS + + +def get_hmac(request_method, path, expires, key, digest="sha1", + ip_range=None): + """ + Returns the hexdigest string of the HMAC (see RFC 2104) for + the request. + + :param request_method: Request method to allow. + :param path: The path to the resource to allow access to. + :param expires: Unix timestamp as an int for when the URL + expires. + :param key: HMAC shared secret. + :param digest: constructor or the string name for the digest to use in + calculating the HMAC + Defaults to SHA1 + :param ip_range: The ip range from which the resource is allowed + to be accessed. We need to put the ip_range as the + first argument to hmac to avoid manipulation of the path + due to newlines being valid in paths + e.g. /v1/a/c/o\\n127.0.0.1 + :returns: hexdigest str of the HMAC for the request using the specified + digest algorithm. + """ + # These are the three mandatory fields. + parts = [request_method, str(expires), path] + formats = [b"%s", b"%s", b"%s"] + + if ip_range: + parts.insert(0, ip_range) + formats.insert(0, b"ip=%s") + + if isinstance(key, str): + key = key.encode('utf8') + + message = b'\n'.join( + fmt % (part if isinstance(part, bytes) + else part.encode("utf-8")) + for fmt, part in zip(formats, parts)) + + return hmac.new(key, message, digest).hexdigest() + + +def get_allowed_digests(conf_digests, logger=None): + """ + Pulls out 'allowed_digests' from the supplied conf. Then compares them with + the list of supported and deprecated digests and returns whatever remain. + + When something is unsupported or deprecated it'll log a warning. + + :param conf_digests: iterable of allowed digests. If empty, defaults to + DEFAULT_ALLOWED_DIGESTS. + :param logger: optional logger; if provided, use it issue deprecation + warnings + :returns: A set of allowed digests that are supported and a set of + deprecated digests. + :raises: ValueError, if there are no digests left to return. + """ + allowed_digests = set(digest.lower() for digest in conf_digests) + if not allowed_digests: + allowed_digests = SUPPORTED_DIGESTS + + not_supported = allowed_digests - SUPPORTED_DIGESTS + if not_supported: + if logger: + logger.warning('The following digest algorithms are configured ' + 'but not supported: %s', ', '.join(not_supported)) + allowed_digests -= not_supported + deprecated = allowed_digests & DEPRECATED_DIGESTS + if deprecated and logger: + if not conf_digests: + logger.warning('The following digest algorithms are allowed by ' + 'default but deprecated: %s. Support will be ' + 'disabled by default in a future release, and ' + 'later removed entirely.', ', '.join(deprecated)) + else: + logger.warning('The following digest algorithms are configured ' + 'but deprecated: %s. 
Support will be removed in a ' + 'future release.', ', '.join(deprecated)) + if not allowed_digests: + raise ValueError('No valid digest algorithms are configured') + + return allowed_digests, deprecated + + +def extract_digest_and_algorithm(value): + """ + Returns a tuple of (digest_algorithm, hex_encoded_digest) + from a client-provided string of the form:: + + + + or:: + + : + + Note that hex-encoded strings must use one of sha1, sha256, or sha512. + + :raises: ValueError on parse failures + """ + if ':' in value: + algo, value = value.split(':', 1) + # accept both standard and url-safe base64 + if ('-' in value or '_' in value) and not ( + '+' in value or '/' in value): + value = value.replace('-', '+').replace('_', '/') + value = binascii.hexlify( + strict_b64decode(value + '==')).decode('ascii') + else: + binascii.unhexlify(value) # make sure it decodes + algo = { + 40: 'sha1', + 64: 'sha256', + 128: 'sha512', + }.get(len(value)) + if not algo: + raise ValueError('Bad digest length') + return algo, value diff --git a/swift/common/direct_client.py b/swift/common/direct_client.py index 4078ec3348..94a4558384 100644 --- a/swift/common/direct_client.py +++ b/swift/common/direct_client.py @@ -1,4 +1,4 @@ -# Copyright (c) 2010-2012 OpenStack, LLC. +# Copyright (c) 2010-2012 OpenStack Foundation # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. @@ -18,80 +18,269 @@ through the proxy. """ +import json +import os import socket -from httplib import HTTPException -from time import time -from urllib import quote as _quote from eventlet import sleep, Timeout - -from swift.common.bufferedhttp import http_connect -from swiftclient import ClientException, json_loads -from swift.common.utils import normalize_timestamp +import pickle # nosec: B403 +from http.client import HTTPException + +from swift.common.bufferedhttp import http_connect, http_connect_raw +from swift.common.exceptions import ClientException +from swift.common.request_helpers import USE_REPLICATION_NETWORK_HEADER, \ + get_ip_port +from swift.common.swob import normalize_etag +from swift.common.utils import Timestamp, FileLikeIter, quote from swift.common.http import HTTP_NO_CONTENT, HTTP_INSUFFICIENT_STORAGE, \ is_success, is_server_error +from swift.common.header_key_dict import HeaderKeyDict + + +class DirectClientException(ClientException): + + def __init__(self, stype, method, node, part, path, resp, host=None): + # host can be used to override the node ip and port reported in + # the exception + host = host if host is not None else node + if isinstance(path, bytes): + path = path.decode("utf-8") + full_path = quote('/%s/%s%s' % (node['device'], part, path)) + msg = '%s server %s:%s direct %s %r gave status %s' % ( + stype, host['ip'], host['port'], method, full_path, resp.status) + headers = HeaderKeyDict(resp.getheaders()) + super(DirectClientException, self).__init__( + msg, http_host=host['ip'], http_port=host['port'], + http_device=node['device'], http_status=resp.status, + http_reason=resp.reason, http_headers=headers) -def quote(value, safe='/'): - if isinstance(value, unicode): - value = value.encode('utf8') - return _quote(value, safe) +class DirectClientReconException(ClientException): + def __init__(self, method, node, path, resp): + if isinstance(path, bytes): + path = path.decode("utf-8") + msg = 'server %s:%s direct %s %r gave status %s' % ( + node['ip'], node['port'], method, path, resp.status) + headers = 
HeaderKeyDict(resp.getheaders()) + super(DirectClientReconException, self).__init__( + msg, http_host=node['ip'], http_port=node['port'], + http_status=resp.status, http_reason=resp.reason, + http_headers=headers) -def direct_get_account(node, part, account, marker=None, limit=None, - prefix=None, delimiter=None, conn_timeout=5, - response_timeout=15): + +def _make_path(*components): + return u'/' + u'/'.join( + x.decode('utf-8') if isinstance(x, bytes) else x + for x in components) + + +def _make_req(node, part, method, path, headers, stype, + conn_timeout=5, response_timeout=15, send_timeout=15, + contents=None, content_length=None, chunk_size=65535): """ - Get listings directly from the account server. + Make request to backend storage node. + (i.e. 'Account', 'Container', 'Object') + :param node: a node dict from a ring + :param part: an integer, the partition number + :param method: a string, the HTTP method (e.g. 'PUT', 'DELETE', etc) + :param path: a string, the request path + :param headers: a dict, header name => value + :param stype: a string, describing the type of service + :param conn_timeout: timeout while waiting for connection; default is 5 + seconds + :param response_timeout: timeout while waiting for response; default is 15 + seconds + :param send_timeout: timeout for sending request body; default is 15 + seconds + :param contents: an iterable or string to read object data from + :param content_length: value to send as content-length header + :param chunk_size: if defined, chunk size of data to send + :returns: an HTTPResponse object + :raises DirectClientException: if the response status is not 2xx + :raises eventlet.Timeout: if either conn_timeout or response_timeout is + exceeded + """ + if contents is not None: + if content_length is not None: + headers['Content-Length'] = str(content_length) + else: + for n, v in headers.items(): + if n.lower() == 'content-length': + content_length = int(v) + if not contents: + headers['Content-Length'] = '0' + if isinstance(contents, str): + contents = [contents] + if content_length is None: + headers['Transfer-Encoding'] = 'chunked' + + ip, port = get_ip_port(node, headers) + headers.setdefault('X-Backend-Allow-Reserved-Names', 'true') + with Timeout(conn_timeout): + conn = http_connect(ip, port, node['device'], part, + method, path, headers=headers) + + if contents is not None: + contents_f = FileLikeIter(contents) + + with Timeout(send_timeout): + if content_length is None: + chunk = contents_f.read(chunk_size) + while chunk: + conn.send(b'%x\r\n%s\r\n' % (len(chunk), chunk)) + chunk = contents_f.read(chunk_size) + conn.send(b'0\r\n\r\n') + else: + left = content_length + while left > 0: + size = chunk_size + if size > left: + size = left + chunk = contents_f.read(size) + if not chunk: + break + conn.send(chunk) + left -= len(chunk) - :param node: node dictionary from the ring - :param part: partition the account is on - :param account: account name - :param marker: marker query - :param limit: query limit - :param prefix: prefix query - :param delimeter: delimeter for the query - :param conn_timeout: timeout in seconds for establishing the connection - :param response_timeout: timeout in seconds for getting the response - :returns: a tuple of (response headers, a list of containers) The response - headers will be a dict and all header names will be lowercase. 
+ with Timeout(response_timeout): + resp = conn.getresponse() + resp.read() + if not is_success(resp.status): + raise DirectClientException(stype, method, node, part, path, resp) + return resp + + +def _get_direct_account_container(path, stype, node, part, + marker=None, limit=None, + prefix=None, delimiter=None, + conn_timeout=5, response_timeout=15, + end_marker=None, reverse=None, headers=None, + extra_params=None): + """Base function for get direct account and container. + + Do not use directly use the direct_get_account or + direct_get_container instead. """ - path = '/' + account - qs = 'format=json' + if headers is None: + headers = {} + + params = {'format': 'json'} + if extra_params: + for key, value in extra_params.items(): + if value is not None: + params[key] = value if marker: - qs += '&marker=%s' % quote(marker) + if 'marker' in params: + raise TypeError('duplicate values for keyword arg: marker') + params['marker'] = quote(marker) if limit: - qs += '&limit=%d' % limit + if 'limit' in params: + raise TypeError('duplicate values for keyword arg: limit') + params['limit'] = '%d' % limit if prefix: - qs += '&prefix=%s' % quote(prefix) + if 'prefix' in params: + raise TypeError('duplicate values for keyword arg: prefix') + params['prefix'] = quote(prefix) if delimiter: - qs += '&delimiter=%s' % quote(delimiter) + if 'delimiter' in params: + raise TypeError('duplicate values for keyword arg: delimiter') + params['delimiter'] = quote(delimiter) + if end_marker: + if 'end_marker' in params: + raise TypeError('duplicate values for keyword arg: end_marker') + params['end_marker'] = quote(end_marker) + if reverse: + if 'reverse' in params: + raise TypeError('duplicate values for keyword arg: reverse') + params['reverse'] = quote(reverse) + qs = '&'.join('%s=%s' % (k, v) for k, v in params.items()) + + ip, port = get_ip_port(node, headers) with Timeout(conn_timeout): - conn = http_connect(node['ip'], node['port'], node['device'], part, - 'GET', path, query_string=qs) + conn = http_connect(ip, port, node['device'], part, + 'GET', path, query_string=qs, + headers=gen_headers(hdrs_in=headers)) with Timeout(response_timeout): resp = conn.getresponse() if not is_success(resp.status): resp.read() - raise ClientException( - 'Account server %s:%s direct GET %s gave status %s' % - (node['ip'], node['port'], - repr('/%s/%s%s' % (node['device'], part, path)), - resp.status), - http_host=node['ip'], http_port=node['port'], - http_device=node['device'], http_status=resp.status, - http_reason=resp.reason) - resp_headers = {} + raise DirectClientException(stype, 'GET', node, part, path, resp) + + resp_headers = HeaderKeyDict() for header, value in resp.getheaders(): - resp_headers[header.lower()] = value + resp_headers[header] = value if resp.status == HTTP_NO_CONTENT: resp.read() return resp_headers, [] - return resp_headers, json_loads(resp.read()) + return resp_headers, json.loads(resp.read()) + + +def gen_headers(hdrs_in=None, add_ts=True): + """ + Get the headers ready for a request. All requests should have a User-Agent + string, but if one is passed in don't over-write it. Not all requests will + need an X-Timestamp, but if one is passed in do not over-write it. 
+ + :param headers: dict or None, base for HTTP headers + :param add_ts: boolean, should be True for any "unsafe" HTTP request + + :returns: HeaderKeyDict based on headers and ready for the request + """ + hdrs_out = HeaderKeyDict(hdrs_in) if hdrs_in else HeaderKeyDict() + if add_ts and 'X-Timestamp' not in hdrs_out: + hdrs_out['X-Timestamp'] = Timestamp.now().internal + if 'user-agent' not in hdrs_out: + hdrs_out['User-Agent'] = 'direct-client %s' % os.getpid() + hdrs_out.setdefault('X-Backend-Allow-Reserved-Names', 'true') + return hdrs_out + + +def direct_get_account(node, part, account, marker=None, limit=None, + prefix=None, delimiter=None, conn_timeout=5, + response_timeout=15, end_marker=None, reverse=None, + headers=None): + """ + Get listings directly from the account server. + + :param node: node dictionary from the ring + :param part: partition the account is on + :param account: account name + :param marker: marker query + :param limit: query limit + :param prefix: prefix query + :param delimiter: delimiter for the query + :param conn_timeout: timeout in seconds for establishing the connection + :param response_timeout: timeout in seconds for getting the response + :param end_marker: end_marker query + :param reverse: reverse the returned listing + :returns: a tuple of (response headers, a list of containers) The response + headers will HeaderKeyDict. + """ + path = _make_path(account) + return _get_direct_account_container(path, "Account", node, part, + headers=headers, + marker=marker, + limit=limit, prefix=prefix, + delimiter=delimiter, + end_marker=end_marker, + reverse=reverse, + conn_timeout=conn_timeout, + response_timeout=response_timeout) + + +def direct_delete_account(node, part, account, conn_timeout=5, + response_timeout=15, headers=None): + if headers is None: + headers = {} + + path = _make_path(account) + _make_req(node, part, 'DELETE', path, gen_headers(headers, True), + 'Account', conn_timeout, response_timeout) def direct_head_container(node, part, account, container, conn_timeout=5, - response_timeout=15): + response_timeout=15, headers=None): """ Request container information directly from the container server. 
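(Not part of the patch.) A minimal usage sketch of the reworked account helpers above, assuming a SAIO-style account server on 127.0.0.1:6202; the node dict, partition number, account name and prefix are invented for illustration.

from swift.common.direct_client import direct_get_account

node = {'ip': '127.0.0.1', 'port': 6202, 'device': 'sdb1',
        'replication_ip': '127.0.0.1', 'replication_port': 6202}
part = 123  # normally looked up in the account ring

# The new end_marker/reverse/headers keyword args are folded into the query
# string by _get_direct_account_container(), and failures now surface as
# DirectClientException rather than hand-built ClientExceptions.
resp_headers, containers = direct_get_account(
    node, part, 'AUTH_test', prefix='images-', end_marker='images-zzz',
    headers={'X-Trans-Id': 'tx-example'})

print(resp_headers.get('X-Account-Container-Count'))
for entry in containers:
    print(entry['name'])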
@@ -101,34 +290,26 @@ def direct_head_container(node, part, account, container, conn_timeout=5, :param container: container name :param conn_timeout: timeout in seconds for establishing the connection :param response_timeout: timeout in seconds for getting the response - :returns: a dict containing the response's headers (all header names will - be lowercase) + :returns: a dict containing the response's headers in a HeaderKeyDict + :raises ClientException: HTTP HEAD request failed """ - path = '/%s/%s' % (account, container) - with Timeout(conn_timeout): - conn = http_connect(node['ip'], node['port'], node['device'], part, - 'HEAD', path) - with Timeout(response_timeout): - resp = conn.getresponse() - resp.read() - if not is_success(resp.status): - raise ClientException( - 'Container server %s:%s direct HEAD %s gave status %s' % - (node['ip'], node['port'], - repr('/%s/%s%s' % (node['device'], part, path)), - resp.status), - http_host=node['ip'], http_port=node['port'], - http_device=node['device'], http_status=resp.status, - http_reason=resp.reason) - resp_headers = {} + if headers is None: + headers = {} + + path = _make_path(account, container) + resp = _make_req(node, part, 'HEAD', path, gen_headers(headers), + 'Container', conn_timeout, response_timeout) + + resp_headers = HeaderKeyDict() for header, value in resp.getheaders(): - resp_headers[header.lower()] = value + resp_headers[header] = value return resp_headers def direct_get_container(node, part, account, container, marker=None, limit=None, prefix=None, delimiter=None, - conn_timeout=5, response_timeout=15): + conn_timeout=5, response_timeout=15, end_marker=None, + reverse=None, headers=None, extra_params=None): """ Get container listings directly from the container server. @@ -139,68 +320,142 @@ def direct_get_container(node, part, account, container, marker=None, :param marker: marker query :param limit: query limit :param prefix: prefix query - :param delimeter: delimeter for the query + :param delimiter: delimiter for the query :param conn_timeout: timeout in seconds for establishing the connection :param response_timeout: timeout in seconds for getting the response + :param end_marker: end_marker query + :param reverse: reverse the returned listing + :param headers: headers to be included in the request + :param extra_params: a dict of extra parameters to be included in the + request. It can be used to pass additional parameters, e.g, + {'states':'updating'} can be used with shard_range/namespace listing. + It can also be used to pass the existing keyword args, like 'marker' or + 'limit', but if the same parameter appears twice in both keyword arg + (not None) and extra_params, this function will raise TypeError. :returns: a tuple of (response headers, a list of objects) The response - headers will be a dict and all header names will be lowercase. + headers will be a HeaderKeyDict. 
""" - path = '/%s/%s' % (account, container) - qs = 'format=json' - if marker: - qs += '&marker=%s' % quote(marker) - if limit: - qs += '&limit=%d' % limit - if prefix: - qs += '&prefix=%s' % quote(prefix) - if delimiter: - qs += '&delimiter=%s' % quote(delimiter) - with Timeout(conn_timeout): - conn = http_connect(node['ip'], node['port'], node['device'], part, - 'GET', path, query_string=qs) - with Timeout(response_timeout): - resp = conn.getresponse() - if not is_success(resp.status): - resp.read() - raise ClientException( - 'Container server %s:%s direct GET %s gave stats %s' % - (node['ip'], node['port'], - repr('/%s/%s%s' % (node['device'], part, path)), - resp.status), - http_host=node['ip'], http_port=node['port'], - http_device=node['device'], http_status=resp.status, - http_reason=resp.reason) - resp_headers = {} - for header, value in resp.getheaders(): - resp_headers[header.lower()] = value - if resp.status == HTTP_NO_CONTENT: - resp.read() - return resp_headers, [] - return resp_headers, json_loads(resp.read()) + path = _make_path(account, container) + return _get_direct_account_container(path, "Container", node, + part, marker=marker, + limit=limit, prefix=prefix, + delimiter=delimiter, + end_marker=end_marker, + reverse=reverse, + conn_timeout=conn_timeout, + response_timeout=response_timeout, + headers=headers, + extra_params=extra_params) def direct_delete_container(node, part, account, container, conn_timeout=5, - response_timeout=15, headers={}): - path = '/%s/%s' % (account, container) - headers['X-Timestamp'] = normalize_timestamp(time()) - with Timeout(conn_timeout): - conn = http_connect(node['ip'], node['port'], node['device'], part, - 'DELETE', path, headers) - with Timeout(response_timeout): - resp = conn.getresponse() - resp.read() - if not is_success(resp.status): - raise ClientException( - 'Container server %s:%s direct DELETE %s gave status %s' % - (node['ip'], node['port'], - repr('/%s/%s%s' % (node['device'], part, path)), resp.status), - http_host=node['ip'], http_port=node['port'], - http_device=node['device'], http_status=resp.status, - http_reason=resp.reason) + response_timeout=15, headers=None): + """ + Delete container directly from the container server. + + :param node: node dictionary from the ring + :param part: partition the container is on + :param account: account name + :param container: container name + :param conn_timeout: timeout in seconds for establishing the connection + :param response_timeout: timeout in seconds for getting the response + :param headers: dict to be passed into HTTPConnection headers + :raises ClientException: HTTP DELETE request failed + """ + if headers is None: + headers = {} + + path = _make_path(account, container) + add_timestamp = 'x-timestamp' not in (k.lower() for k in headers) + _make_req(node, part, 'DELETE', path, gen_headers(headers, add_timestamp), + 'Container', conn_timeout, response_timeout) + + +def direct_put_container(node, part, account, container, conn_timeout=5, + response_timeout=15, headers=None, contents=None, + content_length=None, chunk_size=65535): + """ + Make a PUT request to a container server. 
+ + :param node: node dictionary from the ring + :param part: partition the container is on + :param account: account name + :param container: container name + :param conn_timeout: timeout in seconds for establishing the connection + :param response_timeout: timeout in seconds for getting the response + :param headers: additional headers to include in the request + :param contents: an iterable or string to send in request body (optional) + :param content_length: value to send as content-length header (optional) + :param chunk_size: chunk size of data to send (optional) + :raises ClientException: HTTP PUT request failed + """ + if headers is None: + headers = {} + + lower_headers = set(k.lower() for k in headers) + headers_out = gen_headers(headers, + add_ts='x-timestamp' not in lower_headers) + path = _make_path(account, container) + _make_req(node, part, 'PUT', path, headers_out, 'Container', conn_timeout, + response_timeout, contents=contents, + content_length=content_length, chunk_size=chunk_size) + + +def direct_post_container(node, part, account, container, conn_timeout=5, + response_timeout=15, headers=None): + """ + Make a POST request to a container server. + + :param node: node dictionary from the ring + :param part: partition the container is on + :param account: account name + :param container: container name + :param conn_timeout: timeout in seconds for establishing the connection + :param response_timeout: timeout in seconds for getting the response + :param headers: additional headers to include in the request + :raises ClientException: HTTP PUT request failed + """ + if headers is None: + headers = {} + + lower_headers = set(k.lower() for k in headers) + headers_out = gen_headers(headers, + add_ts='x-timestamp' not in lower_headers) + path = _make_path(account, container) + return _make_req(node, part, 'POST', path, headers_out, 'Container', + conn_timeout, response_timeout) + + +def direct_put_container_object(node, part, account, container, obj, + conn_timeout=5, response_timeout=15, + headers=None): + if headers is None: + headers = {} + + have_x_timestamp = 'x-timestamp' in (k.lower() for k in headers) + + path = _make_path(account, container, obj) + _make_req(node, part, 'PUT', path, + gen_headers(headers, add_ts=(not have_x_timestamp)), + 'Container', conn_timeout, response_timeout) + + +def direct_delete_container_object(node, part, account, container, obj, + conn_timeout=5, response_timeout=15, + headers=None): + if headers is None: + headers = {} + + headers = gen_headers(headers, add_ts='x-timestamp' not in ( + k.lower() for k in headers)) + + path = _make_path(account, container, obj) + _make_req(node, part, 'DELETE', path, headers, + 'Container', conn_timeout, response_timeout) def direct_head_object(node, part, account, container, obj, conn_timeout=5, - response_timeout=15): + response_timeout=15, headers=None): """ Request object information directly from the object server. 
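(Not part of the patch.) A sketch of how the X-Timestamp handling in the new container helpers above behaves, assuming a SAIO-style container server; the node dict, partition, account/container names and the metadata header are invented for the example.

from swift.common.direct_client import (
    direct_put_container, direct_delete_container)
from swift.common.utils import Timestamp

node = {'ip': '127.0.0.1', 'port': 6201, 'device': 'sdb1'}
part = 42  # normally looked up in the container ring

# No X-Timestamp supplied, so gen_headers() stamps the request with "now".
direct_put_container(node, part, 'AUTH_test', 'backups',
                     headers={'X-Container-Meta-Color': 'blue'})

# An explicit X-Timestamp is preserved (add_timestamp ends up False), which
# lets the caller control where the operation lands in timestamp ordering.
direct_delete_container(
    node, part, 'AUTH_test', 'backups',
    headers={'X-Timestamp': Timestamp(1700000001).internal})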
@@ -211,33 +466,27 @@ def direct_head_object(node, part, account, container, obj, conn_timeout=5, :param obj: object name :param conn_timeout: timeout in seconds for establishing the connection :param response_timeout: timeout in seconds for getting the response - :returns: a dict containing the response's headers (all header names will - be lowercase) + :param headers: dict to be passed into HTTPConnection headers + :returns: a dict containing the response's headers in a HeaderKeyDict + :raises ClientException: HTTP HEAD request failed """ - path = '/%s/%s/%s' % (account, container, obj) - with Timeout(conn_timeout): - conn = http_connect(node['ip'], node['port'], node['device'], part, - 'HEAD', path) - with Timeout(response_timeout): - resp = conn.getresponse() - resp.read() - if not is_success(resp.status): - raise ClientException( - 'Object server %s:%s direct HEAD %s gave status %s' % - (node['ip'], node['port'], - repr('/%s/%s%s' % (node['device'], part, path)), - resp.status), - http_host=node['ip'], http_port=node['port'], - http_device=node['device'], http_status=resp.status, - http_reason=resp.reason) - resp_headers = {} + if headers is None: + headers = {} + + headers = gen_headers(headers) + + path = _make_path(account, container, obj) + resp = _make_req(node, part, 'HEAD', path, headers, + 'Object', conn_timeout, response_timeout) + + resp_headers = HeaderKeyDict() for header, value in resp.getheaders(): - resp_headers[header.lower()] = value + resp_headers[header] = value return resp_headers def direct_get_object(node, part, account, container, obj, conn_timeout=5, - response_timeout=15, resp_chunk_size=None, headers={}): + response_timeout=15, resp_chunk_size=None, headers=None): """ Get object directly from the object server. @@ -251,23 +500,23 @@ def direct_get_object(node, part, account, container, obj, conn_timeout=5, :param resp_chunk_size: if defined, chunk size of data to read. :param headers: dict to be passed into HTTPConnection headers :returns: a tuple of (response headers, the object's contents) The response - headers will be a dict and all header names will be lowercase. + headers will be a HeaderKeyDict. 
+ :raises ClientException: HTTP GET request failed """ - path = '/%s/%s/%s' % (account, container, obj) + if headers is None: + headers = {} + + ip, port = get_ip_port(node, headers) + path = _make_path(account, container, obj) with Timeout(conn_timeout): - conn = http_connect(node['ip'], node['port'], node['device'], part, - 'GET', path, headers=headers) + conn = http_connect(ip, port, node['device'], part, + 'GET', path, headers=gen_headers(headers)) with Timeout(response_timeout): resp = conn.getresponse() if not is_success(resp.status): resp.read() - raise ClientException( - 'Object server %s:%s direct GET %s gave status %s' % - (node['ip'], node['port'], - repr('/%s/%s%s' % (node['device'], part, path)), resp.status), - http_host=node['ip'], http_port=node['port'], - http_device=node['device'], http_status=resp.status, - http_reason=resp.reason) + raise DirectClientException('Object', 'GET', node, part, path, resp) + if resp_chunk_size: def _object_body(): @@ -278,16 +527,16 @@ def _object_body(): object_body = _object_body() else: object_body = resp.read() - resp_headers = {} + resp_headers = HeaderKeyDict() for header, value in resp.getheaders(): - resp_headers[header.lower()] = value + resp_headers[header] = value return resp_headers, object_body def direct_put_object(node, part, account, container, name, contents, content_length=None, etag=None, content_type=None, headers=None, conn_timeout=5, response_timeout=15, - resp_chunk_size=None): + chunk_size=65535): """ Put object directly from the object server. @@ -305,42 +554,27 @@ def direct_put_object(node, part, account, container, name, contents, :param response_timeout: timeout in seconds for getting the response :param chunk_size: if defined, chunk size of data to send. :returns: etag from the server response + :raises ClientException: HTTP PUT request failed """ - # TODO: Add chunked puts - path = '/%s/%s/%s' % (account, container, name) + + path = _make_path(account, container, name) if headers is None: headers = {} if etag: - headers['ETag'] = etag.strip('"') - if content_length is not None: - headers['Content-Length'] = str(content_length) + headers['ETag'] = normalize_etag(etag) if content_type is not None: headers['Content-Type'] = content_type else: headers['Content-Type'] = 'application/octet-stream' - if not contents: - headers['Content-Length'] = '0' - if isinstance(contents, basestring): - contents = [contents] - headers['X-Timestamp'] = normalize_timestamp(time()) - with Timeout(conn_timeout): - conn = http_connect(node['ip'], node['port'], node['device'], part, - 'PUT', path, headers=headers) - for chunk in contents: - conn.send(chunk) - with Timeout(response_timeout): - resp = conn.getresponse() - resp.read() - if not is_success(resp.status): - raise ClientException( - 'Object server %s:%s direct PUT %s gave status %s' % - (node['ip'], node['port'], - repr('/%s/%s%s' % (node['device'], part, path)), - resp.status), - http_host=node['ip'], http_port=node['port'], - http_device=node['device'], http_status=resp.status, - http_reason=resp.reason) - return resp.getheader('etag').strip('"') + # Incase the caller want to insert an object with specific age + add_ts = 'X-Timestamp' not in headers + + resp = _make_req( + node, part, 'PUT', path, gen_headers(headers, add_ts=add_ts), + 'Object', conn_timeout, response_timeout, contents=contents, + content_length=content_length, chunk_size=chunk_size) + + return normalize_etag(resp.getheader('etag')) def direct_post_object(node, part, account, container, name, headers, @@ 
-358,27 +592,13 @@ def direct_post_object(node, part, account, container, name, headers, :param response_timeout: timeout in seconds for getting the response :raises ClientException: HTTP POST request failed """ - path = '/%s/%s/%s' % (account, container, name) - headers['X-Timestamp'] = normalize_timestamp(time()) - with Timeout(conn_timeout): - conn = http_connect(node['ip'], node['port'], node['device'], part, - 'POST', path, headers=headers) - with Timeout(response_timeout): - resp = conn.getresponse() - resp.read() - if not is_success(resp.status): - raise ClientException( - 'Object server %s:%s direct POST %s gave status %s' % - (node['ip'], node['port'], - repr('/%s/%s%s' % (node['device'], part, path)), - resp.status), - http_host=node['ip'], http_port=node['port'], - http_device=node['device'], http_status=resp.status, - http_reason=resp.reason) + path = _make_path(account, container, name) + _make_req(node, part, 'POST', path, gen_headers(headers, True), + 'Object', conn_timeout, response_timeout) def direct_delete_object(node, part, account, container, obj, - conn_timeout=5, response_timeout=15, headers={}): + conn_timeout=5, response_timeout=15, headers=None): """ Delete object directly from the object server. @@ -389,25 +609,54 @@ def direct_delete_object(node, part, account, container, obj, :param obj: object name :param conn_timeout: timeout in seconds for establishing the connection :param response_timeout: timeout in seconds for getting the response - :returns: response from server + :raises ClientException: HTTP DELETE request failed """ - path = '/%s/%s/%s' % (account, container, obj) - headers['X-Timestamp'] = normalize_timestamp(time()) + if headers is None: + headers = {} + + headers = gen_headers(headers, add_ts='x-timestamp' not in ( + k.lower() for k in headers)) + + path = _make_path(account, container, obj) + _make_req(node, part, 'DELETE', path, headers, + 'Object', conn_timeout, response_timeout) + + +def direct_get_suffix_hashes(node, part, suffixes, conn_timeout=5, + response_timeout=15, headers=None): + """ + Get suffix hashes directly from the object server. + + Note that unlike other ``direct_client`` functions, this one defaults + to using the replication network to make requests. 
+ + :param node: node dictionary from the ring + :param part: partition the container is on + :param conn_timeout: timeout in seconds for establishing the connection + :param response_timeout: timeout in seconds for getting the response + :param headers: dict to be passed into HTTPConnection headers + :returns: dict of suffix hashes + :raises ClientException: HTTP REPLICATE request failed + """ + if headers is None: + headers = {} + + headers.setdefault(USE_REPLICATION_NETWORK_HEADER, 'true') + ip, port = get_ip_port(node, headers) + path = '/%s' % '-'.join(suffixes) with Timeout(conn_timeout): - conn = http_connect(node['ip'], node['port'], node['device'], part, - 'DELETE', path, headers) + conn = http_connect(ip, port, + node['device'], part, 'REPLICATE', path, + headers=gen_headers(headers)) with Timeout(response_timeout): resp = conn.getresponse() - resp.read() if not is_success(resp.status): - raise ClientException( - 'Object server %s:%s direct DELETE %s gave status %s' % - (node['ip'], node['port'], - repr('/%s/%s%s' % (node['device'], part, path)), - resp.status), - http_host=node['ip'], http_port=node['port'], - http_device=node['device'], http_status=resp.status, - http_reason=resp.reason) + raise DirectClientException('Object', 'REPLICATE', + node, part, path, resp, + host={'ip': node['replication_ip'], + 'port': node['replication_port']} + ) + return pickle.loads(resp.read()) # nosec: B301 def retry(func, *args, **kwargs): @@ -421,28 +670,23 @@ def retry(func, *args, **kwargs): :param kwargs: keyward arguments to send to func (if retries or error_log are sent, they will be deleted from kwargs before sending on to func) - :returns: restult of func - """ - retries = 5 - if 'retries' in kwargs: - retries = kwargs['retries'] - del kwargs['retries'] - error_log = None - if 'error_log' in kwargs: - error_log = kwargs['error_log'] - del kwargs['error_log'] + :returns: result of func + :raises ClientException: all retries failed + """ + retries = kwargs.pop('retries', 5) + error_log = kwargs.pop('error_log', None) attempts = 0 backoff = 1 while attempts <= retries: attempts += 1 try: return attempts, func(*args, **kwargs) - except (socket.error, HTTPException, Timeout), err: + except (socket.error, HTTPException, Timeout) as err: if error_log: error_log(err) if attempts > retries: raise - except ClientException, err: + except ClientException as err: if error_log: error_log(err) if attempts > retries or not is_server_error(err.http_status) or \ @@ -453,8 +697,36 @@ def retry(func, *args, **kwargs): # Shouldn't actually get down here, but just in case. if args and 'ip' in args[0]: raise ClientException('Raise too many retries', - http_host=args[ - 0]['ip'], http_port=args[0]['port'], + http_host=args[0]['ip'], + http_port=args[0]['port'], http_device=args[0]['device']) else: raise ClientException('Raise too many retries') + + +def direct_get_recon(node, recon_command, conn_timeout=5, response_timeout=15, + headers=None): + """ + Get recon json directly from the storage server. 
+ + :param node: node dictionary from the ring + :param recon_command: recon string (post /recon/) + :param conn_timeout: timeout in seconds for establishing the connection + :param response_timeout: timeout in seconds for getting the response + :param headers: dict to be passed into HTTPConnection headers + :returns: deserialized json response + :raises DirectClientReconException: HTTP GET request failed + """ + if headers is None: + headers = {} + + ip, port = get_ip_port(node, headers) + path = '/recon/%s' % recon_command + with Timeout(conn_timeout): + conn = http_connect_raw(ip, port, 'GET', path, + headers=gen_headers(headers)) + with Timeout(response_timeout): + resp = conn.getresponse() + if not is_success(resp.status): + raise DirectClientReconException('GET', node, path, resp) + return json.loads(resp.read()) diff --git a/swift/common/error_limiter.py b/swift/common/error_limiter.py new file mode 100644 index 0000000000..715c326847 --- /dev/null +++ b/swift/common/error_limiter.py @@ -0,0 +1,93 @@ +# Copyright (c) 2021 NVIDIA +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. +import collections +from time import time + +from swift.common.utils import node_to_string + + +class ErrorLimiter(object): + """ + Tracks the number of errors that have occurred for nodes. A node will be + considered to be error-limited for a given interval of time after it has + accumulated more errors than a given limit. + + :param suppression_interval: The number of seconds for which a node is + error-limited once it has accumulated more than ``suppression_limit`` + errors. Should be a float value. + :param suppression_limit: The number of errors that a node must accumulate + before it is considered to be error-limited. Should be an int value. + """ + def __init__(self, suppression_interval, suppression_limit): + self.suppression_interval = float(suppression_interval) + self.suppression_limit = int(suppression_limit) + self.stats = collections.defaultdict(dict) + + def node_key(self, node): + """ + Get the key under which a node's error stats will be stored. + + :param node: dictionary describing a node. + :return: string key. + """ + return node_to_string(node) + + def is_limited(self, node): + """ + Check if the node is currently error limited. + + :param node: dictionary of node to check + :returns: True if error limited, False otherwise + """ + now = time() + node_key = self.node_key(node) + error_stats = self.stats.get(node_key) + + if error_stats is None or 'errors' not in error_stats: + return False + + if 'last_error' in error_stats and error_stats['last_error'] < \ + now - self.suppression_interval: + self.stats.pop(node_key) + return False + return error_stats['errors'] > self.suppression_limit + + def limit(self, node): + """ + Mark a node as error limited. This immediately pretends the + node received enough errors to trigger error suppression. Use + this for errors like Insufficient Storage. For other errors + use :func:`increment`. 
+ + :param node: dictionary of node to error limit + """ + node_key = self.node_key(node) + error_stats = self.stats[node_key] + error_stats['errors'] = self.suppression_limit + 1 + error_stats['last_error'] = time() + + def increment(self, node): + """ + Increment the error count and update the time of the last error for + the given ``node``. + + :param node: dictionary describing a node. + :returns: True if suppression_limit is exceeded, False otherwise + """ + node_key = self.node_key(node) + error_stats = self.stats[node_key] + error_stats['errors'] = error_stats.get('errors', 0) + 1 + error_stats['last_error'] = time() + return error_stats['errors'] > self.suppression_limit diff --git a/swift/common/exceptions.py b/swift/common/exceptions.py index d377009698..74d1540c0d 100644 --- a/swift/common/exceptions.py +++ b/swift/common/exceptions.py @@ -1,4 +1,4 @@ -# Copyright (c) 2010-2012 OpenStack, LLC. +# Copyright (c) 2010-2012 OpenStack Foundation # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. @@ -14,6 +14,7 @@ # limitations under the License. from eventlet import Timeout +from swift.common.utils.timestamp import Timestamp class MessageTimeout(Timeout): @@ -30,11 +31,33 @@ class SwiftException(Exception): pass -class SwiftConfigurationError(SwiftException): +class PutterConnectError(Exception): + + def __init__(self, status=None): + self.status = status + + +class InvalidTimestamp(SwiftException): + pass + + +class InsufficientStorage(SwiftException): + pass + + +class FooterNotSupported(SwiftException): + pass + + +class MultiphasePUTNotSupported(SwiftException): + pass + + +class SuffixSyncError(SwiftException): pass -class AuditException(SwiftException): +class RangeAlreadyComplete(SwiftException): pass @@ -42,7 +65,67 @@ class DiskFileError(SwiftException): pass -class DiskFileNotExist(SwiftException): +class DiskFileNotOpen(DiskFileError): + pass + + +class DiskFileQuarantined(DiskFileError): + pass + + +class DiskFileCollision(DiskFileError): + pass + + +class DiskFileNotExist(DiskFileError): + pass + + +class DiskFileStateChanged(DiskFileError): + """ + Raised when state of a DiskFile changes while it is being opened (e.g. the + list of on-disk files changes). Retrying the DiskFile interface may + succeed. 
+ """ + + +class DiskFileDeleted(DiskFileNotExist): + + def __init__(self, metadata=None): + self.metadata = metadata or {} + self.timestamp = Timestamp( + self.metadata.get('X-Timestamp', Timestamp.zero())) + + +class DiskFileExpired(DiskFileDeleted): + pass + + +class DiskFileNoSpace(DiskFileError): + pass + + +class DiskFileDeviceUnavailable(DiskFileError): + pass + + +class DiskFileXattrNotSupported(DiskFileError): + pass + + +class DiskFileBadMetadataChecksum(DiskFileError): + pass + + +class DeviceUnavailable(SwiftException): + pass + + +class DatabaseAuditorException(SwiftException): + pass + + +class InvalidAccountInfo(DatabaseAuditorException): pass @@ -50,7 +133,15 @@ class PathNotDir(OSError): pass -class AuthException(SwiftException): +class DevIdBytesTooSmall(ValueError): + pass + + +class ChunkReadError(SwiftException): + pass + + +class ShortReadError(SwiftException): pass @@ -66,6 +157,10 @@ class ConnectionTimeout(Timeout): pass +class ResponseTimeout(Timeout): + pass + + class DriveNotMounted(SwiftException): pass @@ -74,6 +169,10 @@ class LockTimeout(MessageTimeout): pass +class RingLoadError(SwiftException): + pass + + class RingBuilderError(SwiftException): pass @@ -90,6 +189,18 @@ class DuplicateDeviceError(RingBuilderError): pass +class UnPicklingError(SwiftException): + pass + + +class FileNotFoundError(SwiftException): + pass + + +class PermissionError(SwiftException): + pass + + class ListingIterError(SwiftException): pass @@ -102,3 +213,114 @@ class ListingIterNotAuthorized(ListingIterError): def __init__(self, aresp): self.aresp = aresp + + +class SegmentError(SwiftException): + pass + + +class LinkIterError(SwiftException): + pass + + +class ReplicationException(Exception): + pass + + +class ReplicationLockTimeout(LockTimeout): + pass + + +class PartitionLockTimeout(LockTimeout): + pass + + +class MimeInvalid(SwiftException): + pass + + +class APIVersionError(SwiftException): + pass + + +class EncryptionException(SwiftException): + pass + + +class UnknownSecretIdError(EncryptionException): + pass + + +class QuarantineRequest(SwiftException): + pass + + +class MemcacheConnectionError(Exception): + pass + + +class MemcacheIncrNotFoundError(MemcacheConnectionError): + pass + + +class MemcachePoolTimeout(Timeout): + pass + + +class ClientException(Exception): + + def __init__(self, msg, http_scheme='', http_host='', http_port='', + http_path='', http_query='', http_status=None, http_reason='', + http_device='', http_response_content='', http_headers=None): + super(ClientException, self).__init__(msg) + self.msg = msg + self.http_scheme = http_scheme + self.http_host = http_host + self.http_port = http_port + self.http_path = http_path + self.http_query = http_query + self.http_status = http_status + self.http_reason = http_reason + self.http_device = http_device + self.http_response_content = http_response_content + self.http_headers = http_headers or {} + + def __str__(self): + a = self.msg + b = '' + if self.http_scheme: + b += '%s://' % self.http_scheme + if self.http_host: + b += self.http_host + if self.http_port: + b += ':%s' % self.http_port + if self.http_path: + b += self.http_path + if self.http_query: + b += '?%s' % self.http_query + if self.http_status: + if b: + b = '%s %s' % (b, self.http_status) + else: + b = str(self.http_status) + if self.http_reason: + if b: + b = '%s %s' % (b, self.http_reason) + else: + b = '- %s' % self.http_reason + if self.http_device: + if b: + b = '%s: device %s' % (b, self.http_device) + else: + b = 'device %s' % 
self.http_device + if self.http_response_content: + if len(self.http_response_content) <= 60: + b += ' %s' % self.http_response_content + else: + b += ' [first 60 chars of response] %s' \ + % self.http_response_content[:60] + return b and '%s: %s' % (a, b) or a + + +class InvalidPidFileException(Exception): + pass diff --git a/swift/common/header_key_dict.py b/swift/common/header_key_dict.py new file mode 100644 index 0000000000..f6b906a15e --- /dev/null +++ b/swift/common/header_key_dict.py @@ -0,0 +1,69 @@ +# Copyright (c) 2010-2012 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + + +class HeaderKeyDict(dict): + """ + A dict that title-cases all keys on the way in, so as to be + case-insensitive. + + Note that all keys and values are expected to be wsgi strings, + though some allowances are made when setting values. + """ + def __init__(self, base_headers=None, **kwargs): + if base_headers: + self.update(base_headers) + self.update(kwargs) + + @staticmethod + def _title(s): + return s.encode('latin1').title().decode('latin1') + + def update(self, other): + if hasattr(other, 'keys'): + for key in other.keys(): + self[self._title(key)] = other[key] + else: + for key, value in other: + self[self._title(key)] = value + + def __getitem__(self, key): + return dict.get(self, self._title(key)) + + def __setitem__(self, key, value): + key = self._title(key) + if value is None: + self.pop(key, None) + elif isinstance(value, bytes): + return dict.__setitem__(self, key, value.decode('latin-1')) + else: + return dict.__setitem__(self, key, str(value)) + + def __contains__(self, key): + return dict.__contains__(self, self._title(key)) + + def __delitem__(self, key): + return dict.__delitem__(self, self._title(key)) + + def get(self, key, default=None): + return dict.get(self, self._title(key), default) + + def setdefault(self, key, value=None): + if key not in self: + self[key] = value + return self[key] + + def pop(self, key, default=None): + return dict.pop(self, self._title(key), default) diff --git a/swift/common/http.py b/swift/common/http.py index cc4bd6fdcb..6dc396062d 100644 --- a/swift/common/http.py +++ b/swift/common/http.py @@ -1,4 +1,4 @@ -# Copyright (c) 2010-2012 OpenStack, LLC. +# Copyright (c) 2010-2012 OpenStack Foundation # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. 
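(Not part of the patch.) A small illustration of the HeaderKeyDict semantics introduced above: keys are title-cased so lookups are case-insensitive, values are coerced to wsgi strings, and assigning None removes a key.

from swift.common.header_key_dict import HeaderKeyDict

headers = HeaderKeyDict({'content-length': 0})
headers['X-Object-Meta-Color'] = b'blue'   # bytes are stored as latin-1 str

assert headers['CONTENT-LENGTH'] == '0'    # lookups are case-insensitive
assert headers.get('x-object-meta-color') == 'blue'

headers['X-Object-Meta-Color'] = None      # assigning None deletes the key
assert 'X-Object-Meta-Color' not in headers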
@@ -21,7 +21,7 @@ def is_informational(status): :param status: http status code :returns: True if status is successful, else False """ - return 100 <= status and status <= 199 + return 100 <= status <= 199 def is_success(status): @@ -31,7 +31,7 @@ def is_success(status): :param status: http status code :returns: True if status is successful, else False """ - return 200 <= status and status <= 299 + return 200 <= status <= 299 def is_redirection(status): @@ -41,7 +41,7 @@ def is_redirection(status): :param status: http status code :returns: True if status is redirection, else False """ - return 300 <= status and status <= 399 + return 300 <= status <= 399 def is_client_error(status): @@ -51,7 +51,7 @@ def is_client_error(status): :param status: http status code :returns: True if status is client error, else False """ - return 400 <= status and status <= 499 + return 400 <= status <= 499 def is_server_error(status): @@ -61,13 +61,13 @@ def is_server_error(status): :param status: http status code :returns: True if status is server error, else False """ - return 500 <= status and status <= 599 + return 500 <= status <= 599 # List of HTTP status codes ############################################################################### -## 1xx Informational +# 1xx Informational ############################################################################### HTTP_CONTINUE = 100 @@ -77,7 +77,7 @@ def is_server_error(status): HTTP_REQUEST_URI_TOO_LONG = 122 ############################################################################### -## 2xx Success +# 2xx Success ############################################################################### HTTP_OK = 200 @@ -91,7 +91,7 @@ def is_server_error(status): HTTP_IM_USED = 226 ############################################################################### -## 3xx Redirection +# 3xx Redirection ############################################################################### HTTP_MULTIPLE_CHOICES = 300 @@ -105,7 +105,7 @@ def is_server_error(status): HTTP_RESUME_INCOMPLETE = 308 ############################################################################### -## 4xx Client Error +# 4xx Client Error ############################################################################### HTTP_BAD_REQUEST = 400 @@ -138,10 +138,11 @@ def is_server_error(status): HTTP_NO_RESPONSE = 444 HTTP_RETRY_WITH = 449 HTTP_BLOCKED_BY_WINDOWS_PARENTAL_CONTROLS = 450 +HTTP_RATE_LIMITED = 498 HTTP_CLIENT_CLOSED_REQUEST = 499 ############################################################################### -## 5xx Server Error +# 5xx Server Error ############################################################################### HTTP_INTERNAL_SERVER_ERROR = 500 diff --git a/swift/common/http_protocol.py b/swift/common/http_protocol.py new file mode 100644 index 0000000000..cce7a9ebd4 --- /dev/null +++ b/swift/common/http_protocol.py @@ -0,0 +1,373 @@ +# Copyright (c) 2010-2022 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
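(Not part of the patch.) A quick, illustrative check that the simplified chained comparisons in swift/common/http.py above classify statuses as before, including the newly added HTTP_RATE_LIMITED constant; the particular constants exercised here are just examples.

from swift.common.http import (
    HTTP_OK, HTTP_NOT_FOUND, HTTP_RATE_LIMITED, HTTP_INSUFFICIENT_STORAGE,
    is_success, is_client_error, is_server_error)

assert is_success(HTTP_OK)                         # 200 <= 200 <= 299
assert is_client_error(HTTP_NOT_FOUND)
assert is_client_error(HTTP_RATE_LIMITED)          # 498 counts as a 4xx
assert is_server_error(HTTP_INSUFFICIENT_STORAGE)  # 507
assert not is_success(HTTP_INSUFFICIENT_STORAGE)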
+ +from eventlet import wsgi, websocket + +from swift.common.utils import generate_trans_id +from swift.common.http import HTTP_NO_CONTENT, HTTP_RESET_CONTENT, \ + HTTP_NOT_MODIFIED + +from eventlet.green.http import client as http_client +from html import escape + + +class SwiftHttpProtocol(wsgi.HttpProtocol): + default_request_version = "HTTP/1.0" + reject_bad_requests = False + + def __init__(self, *args, **kwargs): + # See https://github.com/eventlet/eventlet/pull/590 + self.pre_shutdown_bugfix_eventlet = not getattr( + websocket.WebSocketWSGI, '_WSGI_APP_ALWAYS_IDLE', None) + super().__init__(*args, **kwargs) + + def log_request(self, *a): + """ + Turn off logging requests by the underlying WSGI software. + """ + pass + + def log_message(self, f, *a): + """ + Redirect logging other messages by the underlying WSGI software. + """ + logger = getattr(self.server.app, 'logger', None) + if logger: + logger.error('ERROR WSGI: ' + f, *a) + else: + # eventlet<=0.17.4 doesn't have an error method, and in newer + # versions the output from error is same as info anyway + self.server.log.info('ERROR WSGI: ' + f, *a) + + class MessageClass(wsgi.HttpProtocol.MessageClass): + """Subclass to see when the client didn't provide a Content-Type""" + def get_default_type(self): + """If the client didn't provide a content type, leave it blank.""" + return '' + + def parse_request(self): + """Parse a request (inlined from cpython@7e293984). + + The request should be stored in self.raw_requestline; the results + are in self.command, self.path, self.request_version and + self.headers. + + Return True for success, False for failure; on failure, any relevant + error response has already been sent back. + + """ + self.command = None # set in case of error on the first line + self.request_version = version = self.default_request_version + self.close_connection = True + requestline = self.raw_requestline.decode('iso-8859-1') + requestline = requestline.rstrip('\r\n') + self.requestline = requestline + # Split off \x20 explicitly (see https://bugs.python.org/issue33973) + words = requestline.split(' ') + if len(words) == 0: + return False + + if len(words) >= 3: # Enough to determine protocol version + version = words[-1] + try: + if not version.startswith('HTTP/'): + raise ValueError + base_version_number = version.split('/', 1)[1] + version_number = base_version_number.split(".") + # RFC 2145 section 3.1 says there can be only one "." and + # - major and minor numbers MUST be treated as + # separate integers; + # - HTTP/2.4 is a lower version than HTTP/2.13, which in + # turn is lower than HTTP/12.3; + # - Leading zeros MUST be ignored by recipients. 
+ if len(version_number) != 2: + raise ValueError + version_number = int(version_number[0]), int(version_number[1]) + except (ValueError, IndexError): + self.send_error( + 400, + "Bad request version (%r)" % version) + return False + if version_number >= (1, 1) and \ + self.protocol_version >= "HTTP/1.1": + self.close_connection = False + if version_number >= (2, 0): + self.send_error( + 505, + "Invalid HTTP version (%s)" % base_version_number) + return False + self.request_version = version + + if not 2 <= len(words) <= 3: + self.send_error( + 400, + "Bad request syntax (%r)" % requestline) + return False + command, path = words[:2] + if len(words) == 2: + self.close_connection = True + if command != 'GET': + self.send_error( + 400, + "Bad HTTP/0.9 request type (%r)" % command) + return False + + if path.startswith(('http://', 'https://')): + host, sep, rest = path.partition('//')[2].partition('/') + if sep: + path = '/' + rest + + self.command, self.path = command, path + + # Examine the headers and look for a Connection directive. + try: + self.headers = http_client.parse_headers( + self.rfile, + _class=self.MessageClass) + except http_client.LineTooLong as err: + self.send_error( + 431, + "Line too long", + str(err)) + return False + except http_client.HTTPException as err: + self.send_error( + 431, + "Too many headers", + str(err) + ) + return False + + conntype = self.headers.get('Connection', "") + if conntype.lower() == 'close': + self.close_connection = True + elif (conntype.lower() == 'keep-alive' and + self.protocol_version >= "HTTP/1.1"): + self.close_connection = False + # Examine the headers and look for an Expect directive + expect = self.headers.get('Expect', "") + if (expect.lower() == "100-continue" and + self.protocol_version >= "HTTP/1.1" and + self.request_version >= "HTTP/1.1"): + if not self.handle_expect_100(): + return False + return True + + def get_environ(self, *args, **kwargs): + environ = wsgi.HttpProtocol.get_environ(self, *args, **kwargs) + header_payload = self.headers.get_payload() + if isinstance(header_payload, list) and len(header_payload) == 1: + header_payload = header_payload[0].get_payload() + if header_payload: + # This shouldn't be here. We must've bumped up against + # https://bugs.python.org/issue37093 + headers_raw = list(environ['headers_raw']) + for line in header_payload.rstrip('\r\n').split('\n'): + if ':' not in line or line[:1] in ' \t': + # Well, we're no more broken than we were before... + # Should we support line folding? + # Should we 400 a bad header line? 
+ break + header, value = line.split(':', 1) + value = value.strip(' \t\n\r') + # NB: Eventlet looks at the headers obj to figure out + # whether the client said the connection should close; + # see https://github.com/eventlet/eventlet/blob/v0.25.0/ + # eventlet/wsgi.py#L504 + self.headers.add_header(header, value) + headers_raw.append((header, value)) + wsgi_key = 'HTTP_' + header.replace('-', '_').encode( + 'latin1').upper().decode('latin1') + if wsgi_key in ('HTTP_CONTENT_LENGTH', + 'HTTP_CONTENT_TYPE'): + wsgi_key = wsgi_key[5:] + environ[wsgi_key] = value + environ['headers_raw'] = tuple(headers_raw) + # Since we parsed some more headers, check to see if they + # change how our wsgi.input should behave + te = environ.get('HTTP_TRANSFER_ENCODING', '').lower() + if te.rsplit(',', 1)[-1].strip() == 'chunked': + environ['wsgi.input'].chunked_input = True + else: + length = environ.get('CONTENT_LENGTH') + if length: + length = int(length) + environ['wsgi.input'].content_length = length + if environ.get('HTTP_EXPECT', '').lower() == '100-continue': + environ['wsgi.input'].wfile = self.wfile + environ['wsgi.input'].wfile_line = \ + b'HTTP/1.1 100 Continue\r\n' + return environ + + def _read_request_line(self): + got = super()._read_request_line() + # See https://github.com/eventlet/eventlet/pull/590 + if self.pre_shutdown_bugfix_eventlet: + self.conn_state[2] = wsgi.STATE_REQUEST + return got + + def handle_one_request(self): + got = super().handle_one_request() + # See https://github.com/eventlet/eventlet/pull/590 + if self.pre_shutdown_bugfix_eventlet: + if self.conn_state[2] != wsgi.STATE_CLOSE: + self.conn_state[2] = wsgi.STATE_IDLE + return got + + def send_error(self, code, message=None, explain=None): + """Send and log an error reply, we are overriding the cpython parent + class method, so we can have logger generate txn_id's for error + response from wsgi since we are at the edge of the proxy server. + This sends an error response (so it must be called before any output + has been generated), logs the error, and finally sends a piece of HTML + explaining the error to the user. + + :param code: an HTTP error code + 3 digits + :param message: a simple optional 1 line reason phrase. + *( HTAB / SP / VCHAR / %x80-FF ) + defaults to short entry matching the response code + :param explain: a detailed message defaults to the long entry + matching the response code. + """ + + try: + shortmsg, longmsg = self.responses[code] + except KeyError: + shortmsg, longmsg = '???', '???' + if message is None: + message = shortmsg + if explain is None: + explain = longmsg + + try: + # assume we have a LogAdapter + txn_id = self.server.app.logger.txn_id # just in case it was set + except AttributeError: + # turns out we don't have a LogAdapter, so go direct + txn_id = generate_trans_id('') + self.log_error("code %d, message %s, (txn: %s)", code, + message, txn_id) + else: + # we do have a LogAdapter, but likely not yet a txn_id + txn_id = txn_id or generate_trans_id('') + self.server.app.logger.txn_id = txn_id + self.log_error("code %d, message %s", code, message) + self.send_response(code, message) + self.send_header('Connection', 'close') + + # Message body is omitted for cases described in: + # - RFC7230: 3.3. 1xx, 204(No Content), 304(Not Modified) + # - RFC7231: 6.3.6. 
205(Reset Content) + body = None + exclude_status = (HTTP_NO_CONTENT, + HTTP_RESET_CONTENT, + HTTP_NOT_MODIFIED) + if (code >= 200 and + code not in exclude_status): + # HTML encode to prevent Cross Site Scripting attacks + # (see bug https://bugs.python.org/issue1100201) + content = (self.error_message_format % { + 'code': code, + 'message': escape(message, quote=False), + 'explain': escape(explain, quote=False) + }) + body = content.encode('UTF-8', 'replace') + self.send_header("Content-Type", self.error_content_type) + self.send_header('Content-Length', str(len(body))) + self.send_header('X-Trans-Id', txn_id) + self.send_header('X-Openstack-Request-Id', txn_id) + self.end_headers() + + if self.command != 'HEAD' and body: + self.wfile.write(body) + + +class SwiftHttpProxiedProtocol(SwiftHttpProtocol): + """ + Protocol object that speaks HTTP, including multiple requests, but with + a single PROXY line as the very first thing coming in over the socket. + This is so we can learn what the client's IP address is when Swift is + behind a TLS terminator, like hitch, that does not understand HTTP and + so cannot add X-Forwarded-For or other similar headers. + + See http://www.haproxy.org/download/1.7/doc/proxy-protocol.txt for + protocol details. + """ + def __init__(self, *a, **kw): + self.proxy_address = None + SwiftHttpProtocol.__init__(self, *a, **kw) + + def handle_error(self, connection_line): + connection_line = connection_line.decode('latin-1') + + # No further processing will proceed on this connection under any + # circumstances. We always send the request into the superclass to + # handle any cleanup - this ensures that the request will not be + # processed. + self.rfile.close() + # We don't really have any confidence that an HTTP Error will be + # processable by the client as our transmission broken down between + # ourselves and our gateway proxy before processing the client + # protocol request. Hopefully the operator will know what to do! + msg = 'Invalid PROXY line %r' % connection_line + # Even assuming HTTP we don't even known what version of HTTP the + # client is sending? This entire endeavor seems questionable. + self.request_version = self.default_request_version + # appease http.server + self.command = 'PROXY' + self.send_error(400, msg) + + def handle(self): + """Handle multiple requests if necessary.""" + # ensure the opening line for the connection is a valid PROXY protcol + # line; this is the only IO we do on this connection before any + # additional wrapping further pollutes the raw socket. + connection_line = self.rfile.readline(self.server.url_length_limit) + + if not connection_line.startswith(b'PROXY '): + return self.handle_error(connection_line) + + proxy_parts = connection_line.strip(b'\r\n').split(b' ') + if proxy_parts[1].startswith(b'UNKNOWN'): + # "UNKNOWN", in PROXY protocol version 1, means "not + # TCP4 or TCP6". This includes completely legitimate + # things like QUIC or Unix domain sockets. The PROXY + # protocol (section 2.1) states that the receiver + # (that's us) MUST ignore anything after "UNKNOWN" and + # before the CRLF, essentially discarding the first + # line. 
+ pass + elif proxy_parts[1] in (b'TCP4', b'TCP6') and len(proxy_parts) == 6: + self.client_address = ( + proxy_parts[2].decode('latin-1'), + proxy_parts[4].decode('latin-1')) + self.proxy_address = ( + proxy_parts[3].decode('latin-1'), + proxy_parts[5].decode('latin-1')) + else: + self.handle_error(connection_line) + + return SwiftHttpProtocol.handle(self) + + def get_environ(self, *args, **kwargs): + environ = SwiftHttpProtocol.get_environ(self, *args, **kwargs) + if self.proxy_address: + environ['SERVER_ADDR'] = self.proxy_address[0] + environ['SERVER_PORT'] = self.proxy_address[1] + if self.proxy_address[1] == '443': + environ['wsgi.url_scheme'] = 'https' + environ['HTTPS'] = 'on' + return environ diff --git a/swift/common/internal_client.py b/swift/common/internal_client.py index f861412cae..883cd4e16e 100644 --- a/swift/common/internal_client.py +++ b/swift/common/internal_client.py @@ -1,4 +1,4 @@ -# Copyright (c) 2010-2012 OpenStack, LLC. +# Copyright (c) 2010-2012 OpenStack Foundation # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. @@ -13,17 +13,26 @@ # See the License for the specific language governing permissions and # limitations under the License. -from eventlet import sleep, Timeout +from eventlet import sleep, Timeout, spawn +from eventlet.green import socket +from eventlet.green.http import client as http_client +from eventlet.green.urllib import request as urllib_request import json -from paste.deploy import loadapp +import urllib import struct -from sys import exc_info -from urllib import quote +from sys import exit import zlib +from time import gmtime, strftime, time from zlib import compressobj -from swift.common.http import HTTP_NOT_FOUND -from swift.common.swob import Request +from swift.common.exceptions import ClientException +from swift.common.http import (HTTP_NOT_FOUND, HTTP_MULTIPLE_CHOICES, + is_client_error, is_server_error) +from swift.common.middleware.gatekeeper import GatekeeperMiddleware +from swift.common.request_helpers import USE_REPLICATION_NETWORK_HEADER +from swift.common.swob import Request, bytes_to_wsgi +from swift.common.utils import quote, close_if_possible, drain_and_close +from swift.common.wsgi import loadapp class UnexpectedResponse(Exception): @@ -35,7 +44,7 @@ class UnexpectedResponse(Exception): """ def __init__(self, message, resp): - super(UnexpectedResponse, self).__init__(self, message) + super(UnexpectedResponse, self).__init__(message) self.resp = resp @@ -49,13 +58,25 @@ class CompressingFileReader(object): :param file_obj: File object to wrap. :param compresslevel: Compression level, defaults to 9. + :param chunk_size: Size of chunks read when iterating using object, + defaults to 4096. """ - def __init__(self, file_obj, compresslevel=9): + def __init__(self, file_obj, compresslevel=9, chunk_size=4096): self._f = file_obj + self.compresslevel = compresslevel + self.chunk_size = chunk_size + self.set_initial_state() + + def set_initial_state(self): + """ + Sets the object to the state needed for the first read. 
+ """ + + self._f.seek(0) self._compressor = compressobj( - compresslevel, zlib.DEFLATED, -zlib.MAX_WBITS, zlib.DEF_MEM_LEVEL, - 0) + self.compresslevel, zlib.DEFLATED, -zlib.MAX_WBITS, + zlib.DEF_MEM_LEVEL, 0) self.done = False self.first = True self.crc32 = 0 @@ -71,36 +92,41 @@ def read(self, *a, **kw): """ if self.done: - return '' + return b'' x = self._f.read(*a, **kw) if x: - self.crc32 = zlib.crc32(x, self.crc32) & 0xffffffffL + self.crc32 = zlib.crc32(x, self.crc32) & 0xffffffff self.total_size += len(x) compressed = self._compressor.compress(x) if not compressed: compressed = self._compressor.flush(zlib.Z_SYNC_FLUSH) else: compressed = self._compressor.flush(zlib.Z_FINISH) - crc32 = struct.pack("= HTTP_MULTIPLE_CHOICES: + b''.join(resp.app_iter) break data = json.loads(resp.body) if not data: @@ -245,15 +350,6 @@ def make_path(self, account, container=None, obj=None): not. """ - if isinstance(account, unicode): - account = account.encode('utf-8') - - if isinstance(container, unicode): - container = container.encode('utf-8') - - if isinstance(obj, unicode): - obj = obj.encode('utf-8') - path = '/v1/%s' % quote(account) if container: path += '/%s' % quote(container) @@ -286,17 +382,17 @@ def _set_metadata( """ headers = {} - for k, v in metadata.iteritems(): + for k, v in metadata.items(): if k.lower().startswith(metadata_prefix): headers[k] = v else: headers['%s%s' % (metadata_prefix, k)] = v - self.make_request('POST', path, headers, acceptable_statuses) + self.handle_request('POST', path, headers, acceptable_statuses) # account methods def iter_containers( - self, account, marker='', end_marker='', + self, account, marker='', end_marker='', prefix='', acceptable_statuses=(2, HTTP_NOT_FOUND)): """ Returns an iterator of containers dicts from an account. @@ -305,6 +401,7 @@ def iter_containers( :param marker: Prefix of first desired item, defaults to ''. :param end_marker: Last item returned will be 'less' than this, defaults to ''. + :param prefix: Prefix of containers :param acceptable_statuses: List of status for valid responses, defaults to (2, HTTP_NOT_FOUND). @@ -315,7 +412,36 @@ def iter_containers( """ path = self.make_path(account) - return self._iter_items(path, marker, end_marker, acceptable_statuses) + return self._iter_items(path, marker, end_marker, prefix, + acceptable_statuses) + + def create_account(self, account): + """ + Creates an account. + + :param account: Account to create. + :raises UnexpectedResponse: Exception raised when requests fail + to get a response with an acceptable status + :raises Exception: Exception is raised when code fails in an + unexpected way. + """ + path = self.make_path(account) + self.handle_request('PUT', path, {}, (201, 202)) + + def delete_account(self, account, acceptable_statuses=(2, HTTP_NOT_FOUND)): + """ + Deletes an account. + + :param account: Account to delete. + :param acceptable_statuses: List of status for valid responses, + defaults to (2, HTTP_NOT_FOUND). + :raises UnexpectedResponse: Exception raised when requests fail + to get a response with an acceptable status + :raises Exception: Exception is raised when code fails in an + unexpected way. 
+ """ + path = self.make_path(account) + self.handle_request('DELETE', path, {}, acceptable_statuses) def get_account_info( self, account, acceptable_statuses=(2, HTTP_NOT_FOUND)): @@ -334,13 +460,15 @@ def get_account_info( path = self.make_path(account) resp = self.make_request('HEAD', path, {}, acceptable_statuses) + if not resp.status_int // 100 == 2: + return (0, 0) return (int(resp.headers.get('x-account-container-count', 0)), int(resp.headers.get('x-account-object-count', 0))) def get_account_metadata( - self, account, metadata_prefix='', acceptable_statuses=(2,)): - """ - Gets account metadata. + self, account, metadata_prefix='', acceptable_statuses=(2,), + params=None): + """Gets account metadata. :param account: Account on which to get the metadata. :param metadata_prefix: Used to filter values from the headers @@ -349,7 +477,7 @@ def get_account_metadata( :param acceptable_statuses: List of status for valid responses, defaults to (2,). - :returns : Returns dict of account metadata. + :returns: Returns dict of account metadata. Keys will be lowercase. :raises UnexpectedResponse: Exception raised when requests fail to get a response with an acceptable status @@ -358,7 +486,8 @@ def get_account_metadata( """ path = self.make_path(account) - return self._get_metadata(path, metadata_prefix, acceptable_statuses) + return self._get_metadata(path, metadata_prefix, acceptable_statuses, + headers=None, params=params) def set_account_metadata( self, account, metadata, metadata_prefix='', @@ -390,23 +519,22 @@ def set_account_metadata( # container methods def container_exists(self, account, container): - """ - Checks to see if a container exists. + """Checks to see if a container exists. :param account: The container's account. :param container: Container to check. - :returns : True if container exists, false otherwise. - :raises UnexpectedResponse: Exception raised when requests fail to get a response with an acceptable status :raises Exception: Exception is raised when code fails in an unexpected way. + + :returns: True if container exists, false otherwise. """ path = self.make_path(account, container) resp = self.make_request('HEAD', path, {}, (2, HTTP_NOT_FOUND)) - return resp.status_int != HTTP_NOT_FOUND + return not resp.status_int == HTTP_NOT_FOUND def create_container( self, account, container, headers=None, acceptable_statuses=(2,)): @@ -427,10 +555,11 @@ def create_container( headers = headers or {} path = self.make_path(account, container) - self.make_request('PUT', path, headers, acceptable_statuses) + self.handle_request('PUT', path, headers, acceptable_statuses) def delete_container( - self, account, container, acceptable_statuses=(2, HTTP_NOT_FOUND)): + self, account, container, headers=None, + acceptable_statuses=(2, HTTP_NOT_FOUND)): """ Deletes a container. @@ -445,14 +574,14 @@ def delete_container( unexpected way. """ + headers = headers or {} path = self.make_path(account, container) - self.make_request('DELETE', path, {}, acceptable_statuses) + self.handle_request('DELETE', path, headers, acceptable_statuses) def get_container_metadata( self, account, container, metadata_prefix='', - acceptable_statuses=(2,)): - """ - Gets container metadata. + acceptable_statuses=(2,), params=None): + """Gets container metadata. :param account: The container's account. :param container: Container to get metadata on. @@ -462,7 +591,7 @@ def get_container_metadata( :param acceptable_statuses: List of status for valid responses, defaults to (2,). 
- :returns : Returns dict of container metadata. + :returns: Returns dict of container metadata. Keys will be lowercase. :raises UnexpectedResponse: Exception raised when requests fail to get a response with an acceptable status @@ -471,10 +600,11 @@ def get_container_metadata( """ path = self.make_path(account, container) - return self._get_metadata(path, metadata_prefix, acceptable_statuses) + return self._get_metadata(path, metadata_prefix, acceptable_statuses, + params=params) def iter_objects( - self, account, container, marker='', end_marker='', + self, account, container, marker='', end_marker='', prefix='', acceptable_statuses=(2, HTTP_NOT_FOUND)): """ Returns an iterator of object dicts from a container. @@ -484,6 +614,7 @@ def iter_objects( :param marker: Prefix of first desired item, defaults to ''. :param end_marker: Last item returned will be 'less' than this, defaults to ''. + :param prefix: Prefix of objects :param acceptable_statuses: List of status for valid responses, defaults to (2, HTTP_NOT_FOUND). @@ -494,7 +625,8 @@ def iter_objects( """ path = self.make_path(account, container) - return self._iter_items(path, marker, end_marker, acceptable_statuses) + return self._iter_items(path, marker, end_marker, prefix, + acceptable_statuses) def set_container_metadata( self, account, container, metadata, metadata_prefix='', @@ -528,7 +660,8 @@ def set_container_metadata( def delete_object( self, account, container, obj, - acceptable_statuses=(2, HTTP_NOT_FOUND)): + acceptable_statuses=(2, HTTP_NOT_FOUND), + headers=None): """ Deletes an object. @@ -537,6 +670,7 @@ def delete_object( :param obj: The object. :param acceptable_statuses: List of status for valid responses, defaults to (2, HTTP_NOT_FOUND). + :param headers: extra headers to send with request :raises UnexpectedResponse: Exception raised when requests fail to get a response with an acceptable status @@ -545,13 +679,13 @@ def delete_object( """ path = self.make_path(account, container, obj) - self.make_request('DELETE', path, {}, acceptable_statuses) + self.handle_request('DELETE', path, (headers or {}), + acceptable_statuses) def get_object_metadata( self, account, container, obj, metadata_prefix='', - acceptable_statuses=(2,)): - """ - Gets object metadata. + acceptable_statuses=(2,), headers=None, params=None): + """Gets object metadata. :param account: The object's account. :param container: The object's container. @@ -561,8 +695,9 @@ def get_object_metadata( keys in the dict returned. Defaults to ''. :param acceptable_statuses: List of status for valid responses, defaults to (2,). + :param headers: extra headers to send with request - :returns : Dict of object metadata. + :returns: Dict of object metadata. :raises UnexpectedResponse: Exception raised when requests fail to get a response with an acceptable status @@ -571,7 +706,35 @@ def get_object_metadata( """ path = self.make_path(account, container, obj) - return self._get_metadata(path, metadata_prefix, acceptable_statuses) + return self._get_metadata(path, metadata_prefix, acceptable_statuses, + headers=headers, params=params) + + def get_object(self, account, container, obj, headers=None, + acceptable_statuses=(2,), params=None): + """ + Gets an object. + + :param account: The object's account. + :param container: The object's container. + :param obj: The object name. + :param headers: Headers to send with request, defaults to empty dict. + :param acceptable_statuses: List of status for valid responses, + defaults to (2,). 
+ :param params: A dict of params to be set in request query string, + defaults to None. + + :raises UnexpectedResponse: Exception raised when requests fail + to get a response with an acceptable status + :raises Exception: Exception is raised when code fails in an + unexpected way. + :returns: A 3-tuple (status, headers, iterator of object body) + """ + + headers = headers or {} + path = self.make_path(account, container, obj) + resp = self.make_request( + 'GET', path, headers, acceptable_statuses, params=params) + return (resp.status_int, resp.headers, resp.app_iter) def iter_object_lines( self, account, container, obj, headers=None, @@ -584,7 +747,7 @@ def iter_object_lines( :param account: The object's account. :param container: The object's container. - :param objec_namet: The object. + :param obj: The object. :param acceptable_statuses: List of status for valid responses, defaults to (2,). @@ -596,10 +759,11 @@ def iter_object_lines( headers = headers or {} path = self.make_path(account, container, obj) - resp = self.make_request('GET', path, headers, acceptable_statuses) + if not resp.status_int // 100 == 2: + return - last_part = '' + last_part = b'' compressed = obj.endswith('.gz') # magic in the following zlib.decompressobj argument is courtesy of # Python decompressing gzip chunk-by-chunk @@ -608,7 +772,7 @@ def iter_object_lines( for chunk in resp.app_iter: if compressed: chunk = d.decompress(chunk) - parts = chunk.split('\n') + parts = chunk.split(b'\n') if len(parts) == 1: last_part = last_part + parts[0] else: @@ -647,13 +811,17 @@ def set_object_metadata( path, metadata, metadata_prefix, acceptable_statuses) def upload_object( - self, fobj, account, container, obj, headers=None): + self, fobj, account, container, obj, headers=None, + acceptable_statuses=(2,), params=None): """ :param fobj: File object to read object's content from. :param account: The object's account. :param container: The object's container. :param obj: The object. - :param headers: Headers to send with request, defaults ot empty dict. + :param headers: Headers to send with request, defaults to empty dict. + :param acceptable_statuses: List of acceptable statuses for request. + :param params: A dict of params to be set in request query string, + defaults to None. 
:raises UnexpectedResponse: Exception raised when requests fail to get a response with an acceptable status @@ -662,6 +830,174 @@ def upload_object( """ headers = dict(headers or {}) - headers['Transfer-Encoding'] = 'chunked' + if 'Content-Length' not in headers: + headers['Transfer-Encoding'] = 'chunked' path = self.make_path(account, container, obj) - self.make_request('PUT', path, headers, (2,), fobj) + self.handle_request('PUT', path, headers, acceptable_statuses, fobj, + params=params) + + +def get_auth(url, user, key, auth_version='1.0', **kwargs): + if auth_version != '1.0': + exit('ERROR: swiftclient missing, only auth v1.0 supported') + req = urllib_request.Request(url) + req.add_header('X-Auth-User', user) + req.add_header('X-Auth-Key', key) + conn = urllib_request.urlopen(req) + headers = conn.info() + return ( + headers.getheader('X-Storage-Url'), + headers.getheader('X-Auth-Token')) + + +class SimpleClient(object): + """ + Simple client that is used in bin/swift-dispersion-* and container sync + """ + def __init__(self, url=None, token=None, starting_backoff=1, + max_backoff=5, retries=5): + self.url = url + self.token = token + self.attempts = 0 # needed in swif-dispersion-populate + self.starting_backoff = starting_backoff + self.max_backoff = max_backoff + self.retries = retries + + def base_request(self, method, container=None, name=None, prefix=None, + headers=None, proxy=None, contents=None, + full_listing=None, logger=None, additional_info=None, + timeout=None, marker=None): + # Common request method + trans_start = time() + url = self.url + + if full_listing: + info, body_data = self.base_request( + method, container, name, prefix, headers, proxy, + timeout=timeout, marker=marker) + listing = body_data + while listing: + marker = listing[-1]['name'] + info, listing = self.base_request( + method, container, name, prefix, headers, proxy, + timeout=timeout, marker=marker) + if listing: + body_data.extend(listing) + return [info, body_data] + + if headers is None: + headers = {} + + if self.token: + headers['X-Auth-Token'] = self.token + + if container: + url = '%s/%s' % (url.rstrip('/'), quote(container)) + + if name: + url = '%s/%s' % (url.rstrip('/'), quote(name)) + else: + params = ['format=json'] + if prefix: + params.append('prefix=%s' % prefix) + + if marker: + params.append('marker=%s' % quote(marker)) + + url += '?' 
+ '&'.join(params) + + req = urllib_request.Request(url, headers=headers, data=contents) + if proxy: + proxy = urllib.parse.urlparse(proxy) + req.set_proxy(proxy.netloc, proxy.scheme) + req.get_method = lambda: method + conn = urllib_request.urlopen(req, timeout=timeout) + body = conn.read() + info = conn.info() + try: + body_data = json.loads(body) + except ValueError: + body_data = None + trans_stop = time() + if logger: + sent_content_length = 0 + for n, v in headers.items(): + nl = n.lower() + if nl == 'content-length': + try: + sent_content_length = int(v) + break + except ValueError: + pass + logger.debug("-> " + " ".join( + quote(str(x) if x else "-", ":/") + for x in ( + strftime('%Y-%m-%dT%H:%M:%S', gmtime(trans_stop)), + method, + url, + conn.getcode(), + sent_content_length, + info['content-length'], + trans_start, + trans_stop, + trans_stop - trans_start, + additional_info + ))) + return [info, body_data] + + def retry_request(self, method, **kwargs): + retries = kwargs.pop('retries', self.retries) + self.attempts = 0 + backoff = self.starting_backoff + while self.attempts <= retries: + self.attempts += 1 + try: + return self.base_request(method, **kwargs) + except urllib_request.HTTPError as err: + if is_client_error(err.getcode() or 500): + raise ClientException('Client error', + http_status=err.getcode()) + elif self.attempts > retries: + raise ClientException('Raise too many retries', + http_status=err.getcode()) + except (socket.error, http_client.HTTPException, + urllib_request.URLError): + if self.attempts > retries: + raise + sleep(backoff) + backoff = min(backoff * 2, self.max_backoff) + + def get_account(self, *args, **kwargs): + # Used in swift-dispersion-populate + return self.retry_request('GET', **kwargs) + + def put_container(self, container, **kwargs): + # Used in swift-dispersion-populate + return self.retry_request('PUT', container=container, **kwargs) + + def get_container(self, container, **kwargs): + # Used in swift-dispersion-populate + return self.retry_request('GET', container=container, **kwargs) + + def put_object(self, container, name, contents, **kwargs): + # Used in swift-dispersion-populate + return self.retry_request('PUT', container=container, name=name, + contents=contents.read(), **kwargs) + + +def head_object(url, **kwargs): + """For usage with container sync """ + client = SimpleClient(url=url) + return client.retry_request('HEAD', **kwargs) + + +def put_object(url, **kwargs): + """For usage with container sync """ + client = SimpleClient(url=url) + client.retry_request('PUT', **kwargs) + + +def delete_object(url, **kwargs): + """For usage with container sync """ + client = SimpleClient(url=url) + client.retry_request('DELETE', **kwargs) diff --git a/swift/common/linkat.py b/swift/common/linkat.py new file mode 100644 index 0000000000..a85463a325 --- /dev/null +++ b/swift/common/linkat.py @@ -0,0 +1,82 @@ +# Copyright (c) 2016 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
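Aside (not part of the patch): SimpleClient.retry_request above retries base_request with exponential backoff capped at max_backoff. A condensed sketch of that loop, using a hypothetical helper name and eventlet's green sleep as in the module imports:

from eventlet import sleep

def call_with_backoff(func, retries=5, starting_backoff=1, max_backoff=5):
    # mirrors the retry/backoff shape of SimpleClient.retry_request
    attempts = 0
    backoff = starting_backoff
    while attempts <= retries:
        attempts += 1
        try:
            return func()
        except Exception:
            # the real client treats HTTP client errors as non-retryable;
            # this sketch simply retries until attempts are exhausted
            if attempts > retries:
                raise
        sleep(backoff)
        backoff = min(backoff * 2, max_backoff)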
+ +import os +import ctypes +from ctypes.util import find_library + +__all__ = ['linkat'] + + +class Linkat(object): + + # From include/uapi/linux/fcntl.h + AT_FDCWD = -100 + AT_SYMLINK_FOLLOW = 0x400 + + __slots__ = '_c_linkat' + + def __init__(self): + libc = ctypes.CDLL(find_library('c'), use_errno=True) + + try: + c_linkat = libc.linkat + except AttributeError: + self._c_linkat = None + return + + c_linkat.argtypes = [ctypes.c_int, ctypes.c_char_p, + ctypes.c_int, ctypes.c_char_p, + ctypes.c_int] + c_linkat.restype = ctypes.c_int + + def errcheck(result, func, arguments): + if result == -1: + errno = ctypes.set_errno(0) + raise IOError(errno, 'linkat: %s' % os.strerror(errno)) + else: + return result + + c_linkat.errcheck = errcheck + + self._c_linkat = c_linkat + + @property + def available(self): + return self._c_linkat is not None + + def __call__(self, olddirfd, oldpath, newdirfd, newpath, flags): + """ + linkat() creates a new link (also known as a hard link) + to an existing file. + + See `man 2 linkat` for more info. + """ + if not self.available: + raise EnvironmentError('linkat not available') + + if not isinstance(olddirfd, int) or not isinstance(newdirfd, int): + raise TypeError("fd must be an integer.") + + if isinstance(oldpath, str): + oldpath = oldpath.encode('utf8') + if isinstance(newpath, str): + newpath = newpath.encode('utf8') + + return self._c_linkat(olddirfd, oldpath, newdirfd, newpath, flags) + + +linkat = Linkat() +del Linkat diff --git a/swift/common/manager.py b/swift/common/manager.py index 855a965d09..68dd2089a9 100644 --- a/swift/common/manager.py +++ b/swift/common/manager.py @@ -1,4 +1,4 @@ -# Copyright (c) 2010-2012 OpenStack, LLC. +# Copyright (c) 2010-2012 OpenStack Foundation # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. @@ -13,41 +13,52 @@ # See the License for the specific language governing permissions and # limitations under the License. 
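Aside (not part of the patch): a rough usage sketch for the module-level linkat wrapper defined above. The file names are illustrative; AT_FDCWD resolves both paths relative to the current working directory.

from swift.common.linkat import linkat

if linkat.available:
    # hard-link 'orig.dat' to 'copy.dat' (illustrative names), following
    # symlinks on the source path as AT_SYMLINK_FOLLOW requests
    linkat(linkat.AT_FDCWD, 'orig.dat', linkat.AT_FDCWD, 'copy.dat',
           linkat.AT_SYMLINK_FOLLOW)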
-from __future__ import with_statement + import functools import errno +from optparse import OptionParser import os import resource import signal import time import subprocess import re +import sys +import tempfile +from shutil import which -from swift.common.utils import search_tree, remove_file, write_file +from swift.common.utils import search_tree, remove_file, write_file, readconf +from swift.common.exceptions import InvalidPidFileException SWIFT_DIR = '/etc/swift' RUN_DIR = '/var/run/swift' +PROC_DIR = '/proc' -# auth-server has been removed from ALL_SERVERS, start it explicitly ALL_SERVERS = ['account-auditor', 'account-server', 'container-auditor', - 'container-replicator', 'container-server', 'container-sync', + 'container-replicator', 'container-reconciler', + 'container-server', 'container-sharder', 'container-sync', 'container-updater', 'object-auditor', 'object-server', - 'object-expirer', 'object-replicator', 'object-updater', + 'object-expirer', 'object-replicator', + 'object-reconstructor', 'object-updater', 'proxy-server', 'account-replicator', 'account-reaper'] MAIN_SERVERS = ['proxy-server', 'account-server', 'container-server', 'object-server'] REST_SERVERS = [s for s in ALL_SERVERS if s not in MAIN_SERVERS] -GRACEFUL_SHUTDOWN_SERVERS = MAIN_SERVERS + ['auth-server'] +# aliases mapping +ALIASES = {'all': ALL_SERVERS, 'main': MAIN_SERVERS, 'rest': REST_SERVERS} +GRACEFUL_SHUTDOWN_SERVERS = MAIN_SERVERS +SEAMLESS_SHUTDOWN_SERVERS = MAIN_SERVERS START_ONCE_SERVERS = REST_SERVERS # These are servers that match a type (account-*, container-*, object-*) but # don't use that type-server.conf file and instead use their own. -STANDALONE_SERVERS = ['object-expirer'] +STANDALONE_SERVERS = ['container-reconciler'] -KILL_WAIT = 15 # seconds to wait for servers to die +KILL_WAIT = 15 # seconds to wait for servers to die (by default) WARNING_WAIT = 3 # seconds to wait after message that may just be a warning MAX_DESCRIPTORS = 32768 MAX_MEMORY = (1024 * 1024 * 1024) * 2 # 2 GB +MAX_PROCS = 8192 # workers * disks, can get high def setup_env(): @@ -56,13 +67,26 @@ def setup_env(): try: resource.setrlimit(resource.RLIMIT_NOFILE, (MAX_DESCRIPTORS, MAX_DESCRIPTORS)) + except ValueError: + print("WARNING: Unable to modify file descriptor limit. " + "Running as non-root?") + + try: resource.setrlimit(resource.RLIMIT_DATA, (MAX_MEMORY, MAX_MEMORY)) except ValueError: - print _("WARNING: Unable to increase file descriptor limit. " - "Running as non-root?") + print("WARNING: Unable to modify memory limit. " + "Running as non-root?") + + try: + resource.setrlimit(resource.RLIMIT_NPROC, + (MAX_PROCS, MAX_PROCS)) + except ValueError: + print("WARNING: Unable to modify max process limit. " + "Running as non-root?") - os.environ['PYTHON_EGG_CACHE'] = '/tmp' + # Set PYTHON_EGG_CACHE if it isn't already set + os.environ.setdefault('PYTHON_EGG_CACHE', tempfile.gettempdir()) def command(func): @@ -75,14 +99,16 @@ def command(func): func.publicly_accessible = True @functools.wraps(func) - def wrapped(*a, **kw): - rv = func(*a, **kw) + def wrapped(self, *a, **kw): + rv = func(self, *a, **kw) + if len(self.servers) == 0: + return 1 return 1 if rv else 0 return wrapped def watch_server_pids(server_pids, interval=1, **kwargs): - """Monitor a collection of server pids yeilding back those pids that + """Monitor a collection of server pids yielding back those pids that aren't responding to signals. :param server_pids: a dict, lists of pids [int,...] 
keyed on @@ -98,7 +124,7 @@ def watch_server_pids(server_pids, interval=1, **kwargs): try: # let pid stop if it wants to os.waitpid(pid, os.WNOHANG) - except OSError, e: + except OSError as e: if e.errno not in (errno.ECHILD, errno.ESRCH): raise # else no such child/process # check running pids for server @@ -118,36 +144,117 @@ def watch_server_pids(server_pids, interval=1, **kwargs): time.sleep(0.1) +def safe_kill(pid, sig, name): + """Send signal to process and check process name + + : param pid: process id + : param sig: signal to send + : param name: name to ensure target process + """ + + # check process name for SIG_DFL + if sig == signal.SIG_DFL: + try: + proc_file = '%s/%d/cmdline' % (PROC_DIR, pid) + if os.path.exists(proc_file): + with open(proc_file, 'r') as fd: + if name not in fd.read(): + # unknown process is using the pid + raise InvalidPidFileException() + except IOError: + pass + + os.kill(pid, sig) + + +def kill_group(pid, sig): + """Send signal to process group + + : param pid: process id + : param sig: signal to send + """ + # Negative PID means process group + os.kill(-pid, sig) + + +def get_child_pids(pid): + """ + Get the current set of all child PIDs for a PID. + + :param pid: process id + """ + output = subprocess.check_output( + ["ps", "--ppid", str(pid), "--no-headers", "-o", "pid"]) + return {int(pid) for pid in output.split()} + + +def format_server_name(servername): + """ + Formats server name as swift compatible server names + E.g. swift-object-server + + :param servername: server name + :returns: swift compatible server name and its binary name + """ + if '.' in servername: + servername = servername.split('.', 1)[0] + if '-' not in servername: + servername = '%s-server' % servername + cmd = 'swift-%s' % servername + return servername, cmd + + +def verify_server(server): + """ + Check whether the server is among swift servers or not, and also + checks whether the server's binaries are installed or not. + + :param server: name of the server + :returns: True, when the server name is valid and its binaries are found. + False, otherwise. + """ + if not server: + return False + _, cmd = format_server_name(server) + if which(cmd) is None: + return False + return True + + class UnknownCommandError(Exception): pass -class Manager(): +class Manager(object): """Main class for performing commands on groups of servers. 
:param servers: list of server names as strings """ - def __init__(self, servers): - server_names = set() + def __init__(self, servers, run_dir=RUN_DIR): + self.server_names = set() + self._default_strict = True for server in servers: - if server == 'all': - server_names.update(ALL_SERVERS) - elif server == 'main': - server_names.update(MAIN_SERVERS) - elif server == 'rest': - server_names.update(REST_SERVERS) + if server in ALIASES: + self.server_names.update(ALIASES[server]) + self._default_strict = False elif '*' in server: # convert glob to regex - server_names.update([s for s in ALL_SERVERS if - re.match(server.replace('*', '.*'), s)]) + self.server_names.update([ + s for s in ALL_SERVERS if + re.match(server.replace('*', '.*'), s)]) + self._default_strict = False else: - server_names.add(server) + self.server_names.add(server) self.servers = set() - for name in server_names: - self.servers.add(Server(name)) + for name in self.server_names: + if verify_server(name): + self.servers.add(Server(name, run_dir)) + + def __iter__(self): + return iter(self.servers) @command def status(self, **kwargs): @@ -165,14 +272,23 @@ def start(self, **kwargs): setup_env() status = 0 + strict = kwargs.get('strict') + # if strict not set explicitly + if strict is None: + strict = self._default_strict + for server in self.servers: - server.launch(**kwargs) + status += 0 if server.launch(**kwargs) else 1 + + if not strict: + status = 0 + if not kwargs.get('daemon', True): for server in self.servers: try: status += server.interact(**kwargs) except KeyboardInterrupt: - print _('\nuser quit') + print('\nuser quit') self.stop(**kwargs) break elif kwargs.get('wait', True): @@ -209,7 +325,7 @@ def stop(self, **kwargs): for server in self.servers: signaled_pids = server.stop(**kwargs) if not signaled_pids: - print _('No %s running') % server + print('No %s running' % server) else: server_pids[server] = signaled_pids @@ -218,23 +334,56 @@ def stop(self, **kwargs): for p in pids] # keep track of the pids yeiled back as killed for all servers killed_pids = set() + kill_wait = kwargs.get('kill_wait', KILL_WAIT) for server, killed_pid in watch_server_pids(server_pids, - interval=KILL_WAIT, + interval=kill_wait, **kwargs): - print _("%s (%s) appears to have stopped") % (server, killed_pid) + print("%(server)s (%(pid)s) appears to have stopped" % + {'server': server, 'pid': killed_pid}) killed_pids.add(killed_pid) if not killed_pids.symmetric_difference(signaled_pids): - # all proccesses have been stopped + # all processes have been stopped return 0 # reached interval n watch_pids w/o killing all servers + kill_after_timeout = kwargs.get('kill_after_timeout', False) for server, pids in server_pids.items(): if not killed_pids.issuperset(pids): # some pids of this server were not killed - print _('Waited %s seconds for %s to die; giving up') % ( - KILL_WAIT, server) + if kill_after_timeout: + print('Waited %(kill_wait)s seconds for %(server)s ' + 'to die; killing' % + {'kill_wait': kill_wait, 'server': server}) + # Send SIGKILL to all remaining pids + for pid in set(pids.keys()) - killed_pids: + print('Signal %(server)s pid: %(pid)s signal: ' + '%(signal)s' % {'server': server, + 'pid': pid, + 'signal': signal.SIGKILL}) + # Send SIGKILL to process group + try: + kill_group(pid, signal.SIGKILL) + except OSError as e: + # PID died before kill_group can take action? 
+ if e.errno != errno.ESRCH: + raise + else: + print('Waited %(kill_wait)s seconds for %(server)s ' + 'to die; giving up' % + {'kill_wait': kill_wait, 'server': server}) return 1 + @command + def kill(self, **kwargs): + """stop a server (no error if not running) + """ + status = self.stop(**kwargs) + kwargs['quiet'] = True + if status and not self.status(**kwargs): + # only exit error if the server is still running + return status + return 0 + @command def shutdown(self, **kwargs): """allow current requests to finish on supporting servers @@ -259,12 +408,37 @@ def reload(self, **kwargs): """ kwargs['graceful'] = True status = 0 - for server in self.servers: - m = Manager([server.server]) + for server in self.server_names: + m = Manager([server]) status += m.stop(**kwargs) status += m.start(**kwargs) return status + @command + def reload_seamless(self, **kwargs): + """seamlessly re-exec, then shutdown of old listen sockets on + supporting servers + """ + kwargs.pop('graceful', None) + kwargs['seamless'] = True + status = 0 + for server in self.servers: + signaled_pids = server.stop(**kwargs) + if not signaled_pids: + print('No %s running' % server) + status += 1 + return status + + def kill_child_pids(self, **kwargs): + """kill child pids, optionally servicing accepted connections""" + status = 0 + for server in self.servers: + signaled_pids = server.kill_child_pids(**kwargs) + if not signaled_pids: + print('No %s running' % server) + status += 1 + return status + @command def force_reload(self, **kwargs): """alias for reload @@ -279,9 +453,8 @@ def get_command(self, cmd): """ cmd = cmd.lower().replace('-', '_') - try: - f = getattr(self, cmd) - except AttributeError: + f = getattr(self, cmd, None) + if f is None: raise UnknownCommandError(cmd) if not hasattr(f, 'publicly_accessible'): raise UnknownCommandError(cmd) @@ -309,19 +482,22 @@ def run_command(self, cmd, **kwargs): return f(**kwargs) -class Server(): +class Server(object): """Manage operations on a server or group of servers of similar type :param server: name of server """ - def __init__(self, server): - if '-' not in server: - server = '%s-server' % server + def __init__(self, server, run_dir=RUN_DIR): self.server = server.lower() - self.type = server.rsplit('-', 1)[0] - self.cmd = 'swift-%s' % server + if '.' 
in self.server: + self.server, self.conf = self.server.rsplit('.', 1) + else: + self.conf = None + self.server, self.cmd = format_server_name(self.server) + self.type = self.server.rsplit('-', 1)[0] self.procs = [] + self.run_dir = run_dir def __str__(self): return self.server @@ -338,6 +514,9 @@ def __eq__(self, other): except AttributeError: return False + def __ne__(self, other): + return not self.__eq__(other) + def get_pid_file_name(self, conf_file): """Translate conf_file to a corresponding pid_file @@ -347,9 +526,9 @@ def get_pid_file_name(self, conf_file): """ return conf_file.replace( - os.path.normpath(SWIFT_DIR), RUN_DIR, 1).replace( - '%s-server' % self.type, self.server, 1).rsplit( - '.conf', 1)[0] + '.pid' + os.path.normpath(SWIFT_DIR), self.run_dir, 1).replace( + '%s-server' % self.type, self.server, 1).replace( + '.conf', '.pid', 1) def get_conf_file_name(self, pid_file): """Translate pid_file to a corresponding conf_file @@ -361,27 +540,50 @@ def get_conf_file_name(self, pid_file): """ if self.server in STANDALONE_SERVERS: return pid_file.replace( - os.path.normpath(RUN_DIR), SWIFT_DIR, 1)\ - .rsplit('.pid', 1)[0] + '.conf' + os.path.normpath(self.run_dir), SWIFT_DIR, 1).replace( + '.pid', '.conf', 1) else: return pid_file.replace( - os.path.normpath(RUN_DIR), SWIFT_DIR, 1).replace( - self.server, '%s-server' % self.type, 1).rsplit( - '.pid', 1)[0] + '.conf' + os.path.normpath(self.run_dir), SWIFT_DIR, 1).replace( + self.server, '%s-server' % self.type, 1).replace( + '.pid', '.conf', 1) + + def _find_conf_files(self, server_search): + if self.conf is not None: + return search_tree(SWIFT_DIR, server_search, self.conf + '.conf', + dir_ext=self.conf + '.conf.d') + else: + return search_tree(SWIFT_DIR, server_search + '*', '.conf', + dir_ext='.conf.d') def conf_files(self, **kwargs): """Get conf files for this server - :param: number, if supplied will only lookup the nth server + :param number: if supplied will only lookup the nth server :returns: list of conf files """ - if self.server in STANDALONE_SERVERS: - found_conf_files = search_tree(SWIFT_DIR, self.server + '*', - '.conf') + if self.server == 'object-expirer': + def has_expirer_section(conf_path): + try: + readconf(conf_path, section_name="object-expirer") + except ValueError: + return False + else: + return True + + # config of expirer is preferentially read from object-server + # section. If all object-server.conf doesn't have object-expirer + # section, object-expirer.conf is used. + found_conf_files = [ + conf for conf in self._find_conf_files("object-server") + if has_expirer_section(conf) + ] or self._find_conf_files("object-expirer") + elif self.server in STANDALONE_SERVERS: + found_conf_files = self._find_conf_files(self.server) else: - found_conf_files = search_tree(SWIFT_DIR, '%s-server*' % self.type, - '.conf') + found_conf_files = self._find_conf_files("%s-server" % self.type) + number = kwargs.get('number') if number: try: @@ -390,27 +592,47 @@ def conf_files(self, **kwargs): conf_files = [] else: conf_files = found_conf_files + + def dump_found_configs(): + if found_conf_files: + print('Found configs:') + for i, conf_file in enumerate(found_conf_files): + print(' %d) %s' % (i + 1, conf_file)) + if not conf_files: # maybe there's a config file(s) out there, but I couldn't find it! 
if not kwargs.get('quiet'): - print _('Unable to locate config %sfor %s') % ( - ('number %s ' % number if number else ''), self.server) + if number: + print('Unable to locate config number %(number)s for' + ' %(server)s' % + {'number': number, 'server': self.server}) + else: + print('Unable to locate config for %s' % self.server) if kwargs.get('verbose') and not kwargs.get('quiet'): - if found_conf_files: - print _('Found configs:') - for i, conf_file in enumerate(found_conf_files): - print ' %d) %s' % (i + 1, conf_file) + dump_found_configs() + elif any(["object-expirer" in name for name in conf_files]) and \ + not kwargs.get('quiet'): + print("WARNING: object-expirer.conf is deprecated. " + "Move object-expirers' configuration into " + "object-server.conf.") + if kwargs.get('verbose'): + dump_found_configs() return conf_files def pid_files(self, **kwargs): """Get pid files for this server - :param: number, if supplied will only lookup the nth server + :param number: if supplied will only lookup the nth server :returns: list of pid files """ - pid_files = search_tree(RUN_DIR, '%s*' % self.server, '.pid') + if self.conf is not None: + pid_files = search_tree(self.run_dir, '%s*' % self.server, + exts=[self.conf + '.pid', + self.conf + '.pid.d']) + else: + pid_files = search_tree(self.run_dir, '%s*' % self.server) if kwargs.get('number', 0): conf_files = self.conf_files(**kwargs) # filter pid_files to match the index of numbered conf_file @@ -422,7 +644,37 @@ def iter_pid_files(self, **kwargs): """Generator, yields (pid_file, pids) """ for pid_file in self.pid_files(**kwargs): - yield pid_file, int(open(pid_file).read().strip()) + try: + pid = int(open(pid_file).read().strip()) + except ValueError: + pid = None + yield pid_file, pid + + def _signal_pid(self, sig, pid, pid_file, verbose): + try: + if sig != signal.SIG_DFL: + print('Signal %(server)s pid: %(pid)s signal: ' + '%(signal)s' % + {'server': self.server, 'pid': pid, 'signal': sig}) + safe_kill(pid, sig, 'swift-%s' % self.server) + except InvalidPidFileException: + if verbose: + print('Removing pid file %(pid_file)s with wrong pid ' + '%(pid)d' % {'pid_file': pid_file, 'pid': pid}) + remove_file(pid_file) + return False + except OSError as e: + if e.errno == errno.ESRCH: + # pid does not exist + if verbose: + print("Removing stale pid file %s" % pid_file) + remove_file(pid_file) + elif e.errno == errno.EPERM: + print("No permission to signal PID %d" % pid) + return False + else: + # process exists + return True def signal_pids(self, sig, **kwargs): """Send a signal to pids for this server @@ -434,24 +686,33 @@ def signal_pids(self, sig, **kwargs): """ pids = {} for pid_file, pid in self.iter_pid_files(**kwargs): - try: - if sig != signal.SIG_DFL: - print _('Signal %s pid: %s signal: %s') % (self.server, - pid, sig) - os.kill(pid, sig) - except OSError, e: - if e.errno == errno.ESRCH: - # pid does not exist - if kwargs.get('verbose'): - print _("Removing stale pid file %s") % pid_file - remove_file(pid_file) - elif e.errno == errno.EPERM: - print _("No permission to signal PID %d") % pid - else: - # process exists + if not pid: # Catches None and 0 + print('Removing pid file %s with invalid pid' % pid_file) + remove_file(pid_file) + continue + if self._signal_pid(sig, pid, pid_file, kwargs.get('verbose')): pids[pid] = pid_file return pids + def signal_children(self, sig, **kwargs): + """Send a signal to child pids for this server + + :param sig: signal to send + + :returns: a dict mapping pids (ints) to pid_files (paths) + + """ + 
pids = {} + for pid_file, pid in self.iter_pid_files(**kwargs): + if not pid: # Catches None and 0 + print('Removing pid file %s with invalid pid' % pid_file) + remove_file(pid_file) + continue + for pid in get_child_pids(pid): + if self._signal_pid(sig, pid, pid_file, kwargs.get('verbose')): + pids[pid] = pid_file + return pids + def get_running_pids(self, **kwargs): """Get running pids @@ -464,22 +725,45 @@ def kill_running_pids(self, **kwargs): """Kill running pids :param graceful: if True, attempt SIGHUP on supporting servers + :param seamless: if True, attempt SIGUSR1 on supporting servers :returns: a dict mapping pids (ints) to pid_files (paths) """ graceful = kwargs.get('graceful') + seamless = kwargs.get('seamless') if graceful and self.server in GRACEFUL_SHUTDOWN_SERVERS: sig = signal.SIGHUP + elif seamless and self.server in SEAMLESS_SHUTDOWN_SERVERS: + sig = signal.SIGUSR1 else: sig = signal.SIGTERM return self.signal_pids(sig, **kwargs) + def kill_child_pids(self, **kwargs): + """Kill child pids, leaving server overseer to respawn them + + :param graceful: if True, attempt SIGHUP on supporting servers + :param seamless: if True, attempt SIGUSR1 on supporting servers + + :returns: a dict mapping pids (ints) to pid_files (paths) + + """ + graceful = kwargs.get('graceful') + seamless = kwargs.get('seamless') + if graceful and self.server in GRACEFUL_SHUTDOWN_SERVERS: + sig = signal.SIGHUP + elif seamless and self.server in SEAMLESS_SHUTDOWN_SERVERS: + sig = signal.SIGUSR1 + else: + sig = signal.SIGTERM + return self.signal_children(sig, **kwargs) + def status(self, pids=None, **kwargs): """Display status of server - :param: pids, if not supplied pids will be populated automatically - :param: number, if supplied will only lookup the nth server + :param pids: if not supplied pids will be populated automatically + :param number: if supplied will only lookup the nth server :returns: 1 if server is not running, 0 otherwise """ @@ -491,25 +775,30 @@ def status(self, pids=None, **kwargs): kwargs['quiet'] = True conf_files = self.conf_files(**kwargs) if conf_files: - print _("%s #%d not running (%s)") % (self.server, number, - conf_files[0]) + print("%(server)s #%(number)d not running (%(conf)s)" % + {'server': self.server, 'number': number, + 'conf': conf_files[0]}) else: - print _("No %s running") % self.server + print("No %s running" % self.server) return 1 for pid, pid_file in pids.items(): conf_file = self.get_conf_file_name(pid_file) - print _("%s running (%s - %s)") % (self.server, pid, conf_file) + print("%(server)s running (%(pid)s - %(conf)s)" % + {'server': self.server, 'pid': pid, 'conf': conf_file}) return 0 - def spawn(self, conf_file, once=False, wait=True, daemon=True, **kwargs): + def spawn(self, conf_file, once=False, wait=True, daemon=True, + additional_args=None, **kwargs): """Launch a subprocess for this server. 
:param conf_file: path to conf_file to use as first arg :param once: boolean, add once argument to command :param wait: boolean, if true capture stdout with a pipe - :param daemon: boolean, if true ask server to log to console + :param daemon: boolean, if false ask server to log to console + :param additional_args: list of additional arguments to pass + on the command line - :returns : the pid of the spawned process + :returns: the pid of the spawned process """ args = [self.cmd, conf_file] if once: @@ -517,6 +806,10 @@ def spawn(self, conf_file, once=False, wait=True, daemon=True, **kwargs): if not daemon: # ask the server to log to console args.append('verbose') + if additional_args: + if isinstance(additional_args, str): + additional_args = [additional_args] + args.extend(additional_args) # figure out what we're going to do with stdio if not daemon: @@ -542,10 +835,20 @@ def wait(self, **kwargs): """ status = 0 for proc in self.procs: - # wait for process to close its stdout - output = proc.stdout.read() + # wait for process to close its stdout (if we haven't done that) + if proc.stdout.closed: + output = '' + else: + output = proc.stdout.read().decode('utf8', 'backslashreplace') + proc.stdout.close() + + if kwargs.get('once', False): + # if you don't want once to wait you can send it to the + # background on the command line, I generally just run with + # no-daemon anyway, but this is quieter + proc.wait() if output: - print output + print(output) start = time.time() # wait for process to die (output may just be a warning) while time.time() - start < WARNING_WAIT: @@ -562,7 +865,7 @@ def interact(self, **kwargs): status = 0 for proc in self.procs: # wait for process to terminate - proc.communicate() + proc.communicate() # should handle closing pipes if proc.returncode: status += 1 return status @@ -573,7 +876,7 @@ def launch(self, **kwargs): """ conf_files = self.conf_files(**kwargs) if not conf_files: - return [] + return {} pids = self.get_running_pids(**kwargs) @@ -586,14 +889,17 @@ def launch(self, **kwargs): # any unstarted instances if conf_file in conf_files: already_started = True - print _("%s running (%s - %s)") % (self.server, pid, conf_file) + print("%(server)s running (%(pid)s - %(conf)s)" % + {'server': self.server, 'pid': pid, 'conf': conf_file}) elif not kwargs.get('number', 0): already_started = True - print _("%s running (%s - %s)") % (self.server, pid, pid_file) + print("%(server)s running (%(pid)s - %(pid_file)s)" % + {'server': self.server, 'pid': pid, + 'pid_file': pid_file}) if already_started: - print _("%s already started...") % self.server - return [] + print("%s already started..." % self.server) + return {} if self.server not in START_ONCE_SERVERS: kwargs['once'] = False @@ -601,17 +907,19 @@ def launch(self, **kwargs): pids = {} for conf_file in conf_files: if kwargs.get('once'): - msg = _('Running %s once') % self.server + msg = 'Running %s once' % self.server else: - msg = _('Starting %s') % self.server - print '%s...(%s)' % (msg, conf_file) + msg = 'Starting %s' % self.server + print('%s...(%s)' % (msg, conf_file)) try: pid = self.spawn(conf_file, **kwargs) - except OSError, e: + except OSError as e: if e.errno == errno.ENOENT: - # TODO: should I check if self.cmd exists earlier? - print _("%s does not exist") % self.cmd + # TODO(clayg): should I check if self.cmd exists earlier? 
+ print("%s does not exist" % self.cmd) break + else: + raise pids[pid] = conf_file return pids @@ -623,3 +931,102 @@ def stop(self, **kwargs): """ return self.kill_running_pids(**kwargs) + + +USAGE = \ + """%prog [.] [[.] ...] [options] + +where: + is the name of a swift service e.g. proxy-server. + The '-server' part of the name may be omitted. + 'all', 'main' and 'rest' are reserved words that represent a + group of services. + all: Expands to all swift daemons. + main: Expands to main swift daemons. + (proxy, container, account, object) + rest: Expands to all remaining background daemons (beyond + "main"). + (updater, replicator, auditor, etc) + is an explicit configuration filename without the + .conf extension. If is specified then should + refer to a directory containing the configuration file, e.g.: + + swift-init object.1 start + + will start an object-server using the configuration file + /etc/swift/object-server/1.conf + is a command from the list below. + +Commands: +""" + '\n'.join(["%16s: %s" % x for x in Manager.list_commands()]) + + +def main(): + parser = OptionParser(USAGE) + parser.add_option('-v', '--verbose', action="store_true", + default=False, help="display verbose output") + parser.add_option('-w', '--no-wait', action="store_false", dest="wait", + default=True, help="won't wait for server to start " + "before returning") + parser.add_option('-o', '--once', action="store_true", + default=False, help="only run one pass of daemon") + # this is a negative option, default is options.daemon = True + parser.add_option('-n', '--no-daemon', action="store_false", dest="daemon", + default=True, help="start server interactively") + parser.add_option('-g', '--graceful', action="store_true", + default=False, help="send SIGHUP to supporting servers") + parser.add_option('-c', '--config-num', metavar="N", type="int", + dest="number", default=0, + help="send command to the Nth server only") + parser.add_option('-k', '--kill-wait', metavar="N", type="int", + dest="kill_wait", default=KILL_WAIT, + help="wait N seconds for processes to die (default 15)") + parser.add_option('-r', '--run-dir', type="str", + dest="run_dir", default=RUN_DIR, + help="alternative directory to store running pid files " + "default: %s" % RUN_DIR) + # Changing behaviour if missing config + parser.add_option('--strict', dest='strict', action='store_true', + help="Return non-zero status code if some config is " + "missing. Default mode if all servers are " + "explicitly named.") + # a negative option for strict + parser.add_option('--non-strict', dest='strict', action='store_false', + help="Return zero status code even if some config is " + "missing. 
Default mode if any server is a glob or " + "one of aliases `all`, `main` or `rest`.") + # SIGKILL daemon after kill_wait period + parser.add_option('--kill-after-timeout', dest='kill_after_timeout', + action='store_true', + help="Kill daemon and all children after kill-wait " + "period.") + + options, args = parser.parse_args() + + if len(args) < 2: + parser.print_help() + print('ERROR: specify server(s) and command') + return 1 + + command = args[-1] + servers = args[:-1] + + # this is just a silly swap for me cause I always try to "start main" + commands = dict(Manager.list_commands()).keys() + if command not in commands and servers[0] in commands: + servers.append(command) + command = servers.pop(0) + + manager = Manager(servers, run_dir=options.run_dir) + try: + status = manager.run_command(command, **options.__dict__) + except UnknownCommandError: + parser.print_help() + print('ERROR: unknown command, %s' % command) + status = 1 + + return 1 if status else 0 + + +if __name__ == "__main__": + sys.exit(main()) diff --git a/swift/common/memcached.py b/swift/common/memcached.py index 42e9b34efd..9ffd861f34 100644 --- a/swift/common/memcached.py +++ b/swift/common/memcached.py @@ -1,4 +1,4 @@ -# Copyright (c) 2010-2012 OpenStack, LLC. +# Copyright (c) 2010-2012 OpenStack Foundation # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. @@ -14,43 +14,83 @@ # limitations under the License. """ +Why our own memcache client? +By Michael Barton + +python-memcached doesn't use consistent hashing, so adding or +removing a memcache server from the pool invalidates a huge +percentage of cached items. + +If you keep a pool of python-memcached client objects, each client +object has its own connection to every memcached server, only one of +which is ever in use. So you wind up with n * m open sockets and +almost all of them idle. This client effectively has a pool for each +server, so the number of backend connections is hopefully greatly +reduced. + +python-memcache uses pickle to store things, and there was already a +huge stink about Swift using pickles in memcache +(http://osvdb.org/show/osvdb/86581). That seemed sort of unfair, +since nova and keystone and everyone else use pickles for memcache +too, but it's hidden behind a "standard" library. But changing would +be a security regression at this point. + +Also, pylibmc wouldn't work for us because it needs to use python +sockets in order to play nice with eventlet. + Lucid comes with memcached: v1.4.2. Protocol documentation for that version is at: http://github.com/memcached/memcached/blob/1.4.2/doc/protocol.txt """ -import cPickle as pickle +import os +import json import logging -import socket -import time +# the name of 'time' module is changed to 'tm', to avoid changing the +# signatures of member functions in this file. 
+import time as tm from bisect import bisect -from hashlib import md5 -try: - import simplejson as json -except ImportError: - import json +from eventlet.green import socket, ssl +from eventlet.pools import Pool +from eventlet import Timeout +from configparser import ConfigParser, NoSectionError, NoOptionError +from swift.common import utils +from swift.common.exceptions import MemcacheConnectionError, \ + MemcacheIncrNotFoundError, MemcachePoolTimeout +from swift.common.utils import md5, human_readable, config_true_value, \ + memcached_timing_stats DEFAULT_MEMCACHED_PORT = 11211 CONN_TIMEOUT = 0.3 +POOL_TIMEOUT = 1.0 # WAG IO_TIMEOUT = 2.0 PICKLE_FLAG = 1 JSON_FLAG = 2 NODE_WEIGHT = 50 -PICKLE_PROTOCOL = 2 TRY_COUNT = 3 # if ERROR_LIMIT_COUNT errors occur in ERROR_LIMIT_TIME seconds, the server # will be considered failed for ERROR_LIMIT_DURATION seconds. ERROR_LIMIT_COUNT = 10 -ERROR_LIMIT_TIME = 60 -ERROR_LIMIT_DURATION = 60 +ERROR_LIMIT_TIME = ERROR_LIMIT_DURATION = 60 +DEFAULT_ITEM_SIZE_WARNING_THRESHOLD = -1 + +# Different sample rates for emitting Memcached timing stats. +TIMING_SAMPLE_RATE_HIGH = 0.1 +TIMING_SAMPLE_RATE_MEDIUM = 0.01 +TIMING_SAMPLE_RATE_LOW = 0.001 + +# The max value of a delta expiration time. +EXPTIME_MAXDELTA = 30 * 24 * 60 * 60 def md5hash(key): - return md5(key).hexdigest() + if not isinstance(key, bytes): + key = key.encode('utf-8', errors='surrogateescape') + return md5(key, usedforsecurity=False).hexdigest().encode('ascii') def sanitize_timeout(timeout): @@ -60,13 +100,95 @@ def sanitize_timeout(timeout): translates negative values to mean a delta of 30 days in seconds (and 1 additional second), client beware. """ - if timeout > (30 * 24 * 60 * 60): - timeout += time.time() - return timeout + if timeout > EXPTIME_MAXDELTA: + timeout += tm.time() + return int(timeout) + + +def set_msg(key, flags, timeout, value): + if not isinstance(key, bytes): + raise TypeError('key must be bytes') + if not isinstance(value, bytes): + raise TypeError('value must be bytes') + return b' '.join([ + b'set', + key, + str(flags).encode('ascii'), + str(timeout).encode('ascii'), + str(len(value)).encode('ascii'), + ]) + (b'\r\n' + value + b'\r\n') + + +class MemcacheConnPool(Pool): + """ + Connection pool for Memcache Connections + + The *server* parameter can be a hostname, an IPv4 address, or an IPv6 + address with an optional port. See + :func:`swift.common.utils.parse_socket_string` for details. 
+ """ + + def __init__(self, server, size, connect_timeout, tls_context=None): + Pool.__init__(self, max_size=size) + self.host, self.port = utils.parse_socket_string( + server, DEFAULT_MEMCACHED_PORT) + self._connect_timeout = connect_timeout + self._tls_context = tls_context + + def create(self): + addrs = socket.getaddrinfo(self.host, self.port, socket.AF_UNSPEC, + socket.SOCK_STREAM) + family, socktype, proto, canonname, sockaddr = addrs[0] + sock = socket.socket(family, socket.SOCK_STREAM) + sock.setsockopt(socket.IPPROTO_TCP, socket.TCP_NODELAY, 1) + try: + with Timeout(self._connect_timeout): + sock.connect(sockaddr) + if self._tls_context: + sock = self._tls_context.wrap_socket(sock, + server_hostname=self.host) + except (Exception, Timeout): + sock.close() + raise + return (sock.makefile('rwb'), sock) + + def get(self): + fp, sock = super(MemcacheConnPool, self).get() + try: + if fp is None: + # An error happened previously, so we need a new connection + fp, sock = self.create() + return fp, sock + except MemcachePoolTimeout: + # This is the only place that knows an item was successfully taken + # from the pool, so it has to be responsible for repopulating it. + # Any other errors should get handled in _get_conns(); see the + # comment about timeouts during create() there. + self.put((None, None)) + raise + + +class MemcacheCommand(object): + """ + Helper class that encapsulates common parameters of a command. + + :param method: the name of the MemcacheRing method that was called. + :param key: the memcached key. + """ + __slots__ = ('method', 'key', 'command', 'hash_key') + def __init__(self, method, key): + self.method = method + self.key = key + self.command = method.encode() + self.hash_key = md5hash(key) -class MemcacheConnectionError(Exception): - pass + @property + def key_prefix(self): + # get the prefix of a user provided memcache key by removing the + # content after the last '/', all current usages within swift are using + # prefix, such as "shard-updating-v2", "nvratelimit" and etc. + return self.key.rsplit('/', 1)[0] class MemcacheRing(object): @@ -74,140 +196,299 @@ class MemcacheRing(object): Simple, consistent-hashed memcache client. 
""" - def __init__(self, servers, connect_timeout=CONN_TIMEOUT, - io_timeout=IO_TIMEOUT, tries=TRY_COUNT, - allow_pickle=False, allow_unpickle=False): + def __init__( + self, servers, connect_timeout=CONN_TIMEOUT, + io_timeout=IO_TIMEOUT, pool_timeout=POOL_TIMEOUT, + tries=TRY_COUNT, + max_conns=2, tls_context=None, logger=None, + error_limit_count=ERROR_LIMIT_COUNT, + error_limit_time=ERROR_LIMIT_TIME, + error_limit_duration=ERROR_LIMIT_DURATION, + item_size_warning_threshold=DEFAULT_ITEM_SIZE_WARNING_THRESHOLD): self._ring = {} self._errors = dict(((serv, []) for serv in servers)) self._error_limited = dict(((serv, 0) for serv in servers)) + self._error_limit_count = error_limit_count + self._error_limit_time = error_limit_time + self._error_limit_duration = error_limit_duration for server in sorted(servers): - for i in xrange(NODE_WEIGHT): + for i in range(NODE_WEIGHT): self._ring[md5hash('%s-%s' % (server, i))] = server self._tries = tries if tries <= len(servers) else len(servers) - self._sorted = sorted(self._ring.keys()) - self._client_cache = dict(((server, []) for server in servers)) + self._sorted = sorted(self._ring) + self._client_cache = dict(( + (server, MemcacheConnPool(server, max_conns, connect_timeout, + tls_context=tls_context)) + for server in servers)) self._connect_timeout = connect_timeout self._io_timeout = io_timeout - self._allow_pickle = allow_pickle - self._allow_unpickle = allow_unpickle or allow_pickle + self._pool_timeout = pool_timeout + if logger is None: + self.logger = logging.getLogger() + else: + self.logger = logger + self.item_size_warning_threshold = item_size_warning_threshold + + @property + def memcache_servers(self): + return list(self._client_cache.keys()) + + def _log_error(self, server, cmd, action, msg): + self.logger.error( + "Error %(action)s to memcached: %(server)s" + ": with key_prefix %(key_prefix)s, method %(method)s: %(msg)s", + {'action': action, 'server': server, 'key_prefix': cmd.key_prefix, + 'method': cmd.method, 'msg': msg}) - def _exception_occurred(self, server, e, action='talking'): - if isinstance(e, socket.timeout): - logging.error(_("Timeout %(action)s to memcached: %(server)s"), - {'action': action, 'server': server}) + """ + Handles exceptions. + + :param server: a server. + :param e: an exception. + :param cmd: an instance of MemcacheCommand. + :param conn_start_time: the time at which the failed operation started. + :param action: a verb describing the operation. + :param sock: an optional socket that needs to be closed by this method. + :param fp: an optional file pointer that needs to be closed by this method. + :param got_connection: if ``True``, the server's connection will be reset + in the cached connection pool. + """ + def _exception_occurred(self, server, e, cmd, conn_start_time, + action='talking', sock=None, + fp=None, got_connection=True): + if isinstance(e, Timeout): + self.logger.error( + "Timeout %(action)s to memcached: %(server)s" + ": with key_prefix %(key_prefix)s, method %(method)s, " + "config_timeout %(config_timeout)s, time_spent %(time_spent)s", + {'action': action, 'server': server, + 'key_prefix': cmd.key_prefix, 'method': cmd.method, + 'config_timeout': e.seconds, + 'time_spent': tm.time() - conn_start_time}) + self.logger.timing_since( + 'memcached.' 
+ cmd.method + '.timeout.timing', + conn_start_time) + elif isinstance(e, (socket.error, MemcacheConnectionError)): + self.logger.error( + "Error %(action)s to memcached: %(server)s: " + "with key_prefix %(key_prefix)s, method %(method)s, " + "time_spent %(time_spent)s, %(err)s", + {'action': action, 'server': server, + 'key_prefix': cmd.key_prefix, 'method': cmd.method, + 'time_spent': tm.time() - conn_start_time, 'err': e}) + self.logger.timing_since( + 'memcached.' + cmd.method + '.conn_err.timing', + conn_start_time) else: - logging.exception(_("Error %(action)s to memcached: %(server)s"), - {'action': action, 'server': server}) - now = time.time() - self._errors[server].append(time.time()) - if len(self._errors[server]) > ERROR_LIMIT_COUNT: + self.logger.exception( + "Error %(action)s to memcached: %(server)s" + ": with key_prefix %(key_prefix)s, method %(method)s, " + "time_spent %(time_spent)s", + {'action': action, 'server': server, + 'key_prefix': cmd.key_prefix, 'method': cmd.method, + 'time_spent': tm.time() - conn_start_time}) + self.logger.timing_since( + 'memcached.' + cmd.method + '.errors.timing', conn_start_time) + + try: + if fp: + fp.close() + del fp + except Exception: + pass + try: + if sock: + sock.close() + del sock + except Exception: + pass + if got_connection: + # We need to return something to the pool + # A new connection will be created the next time it is retrieved + self._return_conn(server, None, None) + + if isinstance(e, MemcacheIncrNotFoundError): + # these errors can be caused by other greenthreads not yielding to + # the incr greenthread often enough, rather than a server problem, + # so don't error limit the server + return + + if self._error_limit_time <= 0 or self._error_limit_duration <= 0: + return + + now = tm.time() + self._errors[server].append(now) + if len(self._errors[server]) > self._error_limit_count: self._errors[server] = [err for err in self._errors[server] - if err > now - ERROR_LIMIT_TIME] - if len(self._errors[server]) > ERROR_LIMIT_COUNT: - self._error_limited[server] = now + ERROR_LIMIT_DURATION - logging.error(_('Error limiting server %s'), server) + if err > now - self._error_limit_time] + if len(self._errors[server]) > self._error_limit_count: + self._error_limited[server] = now + self._error_limit_duration + self.logger.error('Error limiting server %s', server) - def _get_conns(self, key): + def _get_conns(self, cmd): """ Retrieves a server conn from the pool, or connects a new one. Chooses the server based on a consistent hash of "key". + + :param cmd: an instance of MemcacheCommand. 
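# Illustrative stand-alone sketch of the server selection described above:
# every server is hashed NODE_WEIGHT times onto a ring of md5 values, and a
# key's candidate servers are found with bisect, walking clockwise until
# `tries` distinct servers are collected (Swift caps tries at the server count;
# NODE_WEIGHT below is an assumed stand-in for the module constant).
import hashlib
from bisect import bisect

NODE_WEIGHT = 50

def build_ring(servers):
    ring = {}
    for server in sorted(servers):
        for i in range(NODE_WEIGHT):
            point = hashlib.md5(('%s-%s' % (server, i)).encode()).hexdigest()
            ring[point] = server
    return ring, sorted(ring)

def servers_for_key(ring, sorted_points, hash_key, tries):
    pos = bisect(sorted_points, hash_key)
    served = []
    while len(served) < tries:
        pos = (pos + 1) % len(sorted_points)
        server = ring[sorted_points[pos]]
        if server not in served:
            served.append(server)
    return served

ring, points = build_ring(['10.0.0.1:11211', '10.0.0.2:11211'])
key = hashlib.md5(b'some/cache/key').hexdigest()
print(servers_for_key(ring, points, key, tries=2))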
+ :return: generator to serve memcached connection """ - pos = bisect(self._sorted, key) + pos = bisect(self._sorted, cmd.hash_key) served = [] + any_yielded = False while len(served) < self._tries: pos = (pos + 1) % len(self._sorted) server = self._ring[self._sorted[pos]] if server in served: continue served.append(server) - if self._error_limited[server] > time.time(): + pool_start_time = tm.time() + if self._error_limited[server] > pool_start_time: continue + sock = None try: - fp, sock = self._client_cache[server].pop() + with MemcachePoolTimeout(self._pool_timeout): + fp, sock = self._client_cache[server].get() + any_yielded = True yield server, fp, sock - except IndexError: - try: - if ':' in server: - host, port = server.split(':') - else: - host = server - port = DEFAULT_MEMCACHED_PORT - sock = socket.socket(socket.AF_INET, socket.SOCK_STREAM) - sock.setsockopt(socket.IPPROTO_TCP, socket.TCP_NODELAY, 1) - sock.settimeout(self._connect_timeout) - sock.connect((host, int(port))) - sock.settimeout(self._io_timeout) - yield server, sock.makefile(), sock - except Exception, e: - self._exception_occurred(server, e, 'connecting') + except MemcachePoolTimeout as e: + self._exception_occurred(server, e, cmd, pool_start_time, + action='getting a connection', + got_connection=False) + except (Exception, Timeout) as e: + # Typically a Timeout exception caught here is the one raised + # by the create() method of this server's MemcacheConnPool + # object. + self._exception_occurred(server, e, cmd, pool_start_time, + action='connecting', sock=sock) + if not any_yielded: + self._log_error('ALL', cmd, 'connecting', + 'No more memcached servers to try') def _return_conn(self, server, fp, sock): - """ Returns a server connection to the pool """ - self._client_cache[server].append((fp, sock)) - - def set(self, key, value, serialize=True, timeout=0): + """Returns a server connection to the pool.""" + self._client_cache[server].put((fp, sock)) + + # Sample rates of different memcached operations are based on generic + # swift usage patterns. + @memcached_timing_stats(sample_rate=TIMING_SAMPLE_RATE_HIGH) + def set(self, key, value, serialize=True, time=0, + min_compress_len=0, raise_on_error=False): """ Set a key/value pair in memcache :param key: key :param value: value :param serialize: if True, value is serialized with JSON before sending - to memcache, or with pickle if configured to use - pickle instead of JSON (to avoid cache poisoning) - :param timeout: ttl in memcache + to memcache + :param time: the time to live + :param min_compress_len: minimum compress length, this parameter was + added to keep the signature compatible with + python-memcached interface. This + implementation ignores it. + :param raise_on_error: if True, propagate Timeouts and other errors. + By default, errors are ignored. 
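# Illustrative sketch of the memcached ASCII "set" frame that the method above
# sends; this module builds it via set_msg(), and the helper below is only an
# assumed equivalent, not the actual implementation:
#   set <hashed key> <flags> <expiry> <byte count>\r\n<value>\r\n
def sketch_set_msg(hash_key, flags, timeout, value):
    return b' '.join([
        b'set', hash_key,
        str(flags).encode('ascii'),
        str(timeout).encode('ascii'),
        str(len(value)).encode('ascii'),
    ]) + b'\r\n' + value + b'\r\n'

# e.g. a JSON-serialized value (the flags bit is assumed to be the JSON flag)
print(sketch_set_msg(b'0f3a' * 8, 2, 300, b'"cached-value"'))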
""" - key = md5hash(key) - timeout = sanitize_timeout(timeout) + cmd = MemcacheCommand('set', key) + timeout = sanitize_timeout(time) flags = 0 - if serialize and self._allow_pickle: - value = pickle.dumps(value, PICKLE_PROTOCOL) - flags |= PICKLE_FLAG - elif serialize: - value = json.dumps(value) + if serialize: + if isinstance(value, bytes): + value = value.decode('utf8') + value = json.dumps(value).encode('ascii') flags |= JSON_FLAG - for (server, fp, sock) in self._get_conns(key): + elif not isinstance(value, bytes): + value = str(value).encode('utf-8') + + if 0 <= self.item_size_warning_threshold <= len(value): + self.logger.warning( + "Item size larger than warning threshold: " + "%d (%s) >= %d (%s)", len(value), + human_readable(len(value)), + self.item_size_warning_threshold, + human_readable(self.item_size_warning_threshold)) + + for (server, fp, sock) in self._get_conns(cmd): + conn_start_time = tm.time() try: - sock.sendall('set %s %d %d %s noreply\r\n%s\r\n' % - (key, flags, timeout, len(value), value)) - self._return_conn(server, fp, sock) - return - except Exception, e: - self._exception_occurred(server, e) - - def get(self, key): + with Timeout(self._io_timeout): + sock.sendall(set_msg(cmd.hash_key, flags, timeout, value)) + # Wait for the set to complete + msg = fp.readline().strip() + if msg != b'STORED': + msg = msg.decode('ascii') + raise MemcacheConnectionError('failed set: %s' % msg) + self._return_conn(server, fp, sock) + return + except (Exception, Timeout) as e: + self._exception_occurred(server, e, cmd, conn_start_time, + sock=sock, fp=fp) + if raise_on_error: + raise MemcacheConnectionError( + "No memcached connections succeeded.") + + @memcached_timing_stats(sample_rate=TIMING_SAMPLE_RATE_MEDIUM) + def get(self, key, raise_on_error=False): """ Gets the object specified by key. It will also unserialize the object - before returning if it is serialized in memcache with JSON, or if it - is pickled and unpickling is allowed. + before returning if it is serialized in memcache with JSON. :param key: key + :param raise_on_error: if True, propagate Timeouts and other errors. + By default, errors are treated as cache misses. 
:returns: value of the key in memcache """ - key = md5hash(key) + cmd = MemcacheCommand('get', key) value = None - for (server, fp, sock) in self._get_conns(key): + for (server, fp, sock) in self._get_conns(cmd): + conn_start_time = tm.time() try: - sock.sendall('get %s\r\n' % key) - line = fp.readline().strip().split() - while line[0].upper() != 'END': - if line[0].upper() == 'VALUE' and line[1] == key: - size = int(line[3]) - value = fp.read(size) - if int(line[2]) & PICKLE_FLAG: - if self._allow_unpickle: - value = pickle.loads(value) - else: - value = None - elif int(line[2]) & JSON_FLAG: - value = json.loads(value) - fp.readline() + with Timeout(self._io_timeout): + sock.sendall(b'get ' + cmd.hash_key + b'\r\n') line = fp.readline().strip().split() - self._return_conn(server, fp, sock) - return value - except Exception, e: - self._exception_occurred(server, e) - - def incr(self, key, delta=1, timeout=0): + while True: + if not line: + raise MemcacheConnectionError('incomplete read') + if line[0].upper() == b'END': + break + if (line[0].upper() == b'VALUE' and + line[1] == cmd.hash_key): + size = int(line[3]) + value = fp.read(size) + if int(line[2]) & PICKLE_FLAG: + value = None + if int(line[2]) & JSON_FLAG: + value = json.loads(value) + fp.readline() + line = fp.readline().strip().split() + self._return_conn(server, fp, sock) + return value + except (Exception, Timeout) as e: + self._exception_occurred(server, e, cmd, conn_start_time, + sock=sock, fp=fp) + if raise_on_error: + raise MemcacheConnectionError( + "No memcached connections succeeded.") + + def _incr_or_decr(self, fp, sock, cmd, delta): + sock.sendall(b' '.join([cmd.command, cmd.hash_key, delta]) + b'\r\n') + line = fp.readline().strip().split() + if not line: + raise MemcacheConnectionError('incomplete read') + if line[0].upper() == b'NOT_FOUND': + return None + return int(line[0].strip()) + + def _add(self, fp, sock, cmd, add_val, timeout): + sock.sendall(b' '.join([ + b'add', cmd.hash_key, b'0', str(timeout).encode('ascii'), + str(len(add_val)).encode('ascii') + ]) + b'\r\n' + add_val + b'\r\n') + line = fp.readline().strip().split() + return None if line[0].upper() == b'NOT_STORED' else int(add_val) + + @memcached_timing_stats(sample_rate=TIMING_SAMPLE_RATE_LOW) + def incr(self, key, delta=1, time=0): """ Increments a key which has a numeric value by delta. If the key can't be found, it's added as delta or 0 if delta < 0. 
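# Illustrative sketch of the incr fallback described above, written against a
# connected memcached file/socket pair (fp and sock here are assumptions, and
# only positive deltas / "incr" are shown; "decr" is symmetrical): try incr,
# on NOT_FOUND add the starting value, and if that add loses a race to another
# client (NOT_STORED) retry the incr once.
def sketch_incr(fp, sock, hash_key, delta, ttl):
    def try_incr():
        sock.sendall(b'incr %s %d\r\n' % (hash_key, delta))
        line = fp.readline().strip()
        return None if line.upper() == b'NOT_FOUND' else int(line)

    new_val = try_incr()
    if new_val is None:
        start = b'%d' % delta
        sock.sendall(b'add %s 0 %d %d\r\n%s\r\n'
                     % (hash_key, ttl, len(start), start))
        if fp.readline().strip().upper() == b'NOT_STORED':
            new_val = try_incr()   # another client added the key first
        else:
            new_val = delta
    return new_val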
@@ -220,41 +501,40 @@ def incr(self, key, delta=1, timeout=0): :param key: key :param delta: amount to add to the value of key (or set as the value if the key is not found) will be cast to an int - :param timeout: ttl in memcache + :param time: the time to live + :returns: result of incrementing :raises MemcacheConnectionError: """ - key = md5hash(key) - command = 'incr' - if delta < 0: - command = 'decr' - delta = str(abs(int(delta))) - timeout = sanitize_timeout(timeout) - for (server, fp, sock) in self._get_conns(key): + cmd = MemcacheCommand('incr' if delta >= 0 else 'decr', key) + delta_val = str(abs(int(delta))).encode('ascii') + timeout = sanitize_timeout(time) + for (server, fp, sock) in self._get_conns(cmd): + conn_start_time = tm.time() try: - sock.sendall('%s %s %s\r\n' % (command, key, delta)) - line = fp.readline().strip().split() - if line[0].upper() == 'NOT_FOUND': - add_val = delta - if command == 'decr': - add_val = '0' - sock.sendall('add %s %d %d %s\r\n%s\r\n' % - (key, 0, timeout, len(add_val), add_val)) - line = fp.readline().strip().split() - if line[0].upper() == 'NOT_STORED': - sock.sendall('%s %s %s\r\n' % (command, key, delta)) - line = fp.readline().strip().split() - ret = int(line[0].strip()) - else: - ret = int(add_val) - else: - ret = int(line[0].strip()) - self._return_conn(server, fp, sock) - return ret - except Exception, e: - self._exception_occurred(server, e) - raise MemcacheConnectionError("No Memcached connections succeeded.") - - def decr(self, key, delta=1, timeout=0): + with Timeout(self._io_timeout): + new_val = self._incr_or_decr(fp, sock, cmd, delta_val) + if new_val is None: + add_val = b'0' if cmd.method == 'decr' else delta_val + new_val = self._add(fp, sock, cmd, add_val, timeout) + if new_val is None: + new_val = self._incr_or_decr( + fp, sock, cmd, delta_val) + if new_val is None: + # This can happen if this thread takes more + # than the TTL to get from the first failed + # incr to the second incr, during which time + # the key was concurrently added and expired. + raise MemcacheIncrNotFoundError( + 'expired ttl=%s' % time) + self._return_conn(server, fp, sock) + return new_val + except (Exception, Timeout) as e: + self._exception_occurred(server, e, cmd, conn_start_time, + sock=sock, fp=fp) + raise MemcacheConnectionError("No memcached connections succeeded.") + + @memcached_timing_stats(sample_rate=TIMING_SAMPLE_RATE_LOW) + def decr(self, key, delta=1, time=0): """ Decrements a key which has a numeric value by delta. Calls incr with -delta. @@ -263,97 +543,215 @@ def decr(self, key, delta=1, timeout=0): :param delta: amount to subtract to the value of key (or set the value to 0 if the key is not found) will be cast to an int - :param timeout: ttl in memcache + :param time: the time to live + :returns: result of decrementing :raises MemcacheConnectionError: """ - self.incr(key, delta=-delta, timeout=timeout) + return self.incr(key, delta=-delta, time=time) - def delete(self, key): + @memcached_timing_stats(sample_rate=TIMING_SAMPLE_RATE_HIGH) + def delete(self, key, server_key=None): """ Deletes a key/value pair from memcache. 
:param key: key to be deleted + :param server_key: key to use in determining which server in the ring + is used """ - key = md5hash(key) - for (server, fp, sock) in self._get_conns(key): + cmd = server_cmd = MemcacheCommand('delete', key) + if server_key: + server_cmd = MemcacheCommand('delete', server_key) + for (server, fp, sock) in self._get_conns(server_cmd): + conn_start_time = tm.time() try: - sock.sendall('delete %s noreply\r\n' % key) - self._return_conn(server, fp, sock) - return - except Exception, e: - self._exception_occurred(server, e) - - def set_multi(self, mapping, server_key, serialize=True, timeout=0): + with Timeout(self._io_timeout): + sock.sendall(b'delete ' + cmd.hash_key + b'\r\n') + # Wait for the delete to complete + fp.readline() + self._return_conn(server, fp, sock) + return + except (Exception, Timeout) as e: + self._exception_occurred(server, e, cmd, conn_start_time, + sock=sock, fp=fp) + + @memcached_timing_stats(sample_rate=TIMING_SAMPLE_RATE_HIGH) + def set_multi(self, mapping, server_key, serialize=True, time=0, + min_compress_len=0): """ Sets multiple key/value pairs in memcache. - :param mapping: dictonary of keys and values to be set in memcache - :param servery_key: key to use in determining which server in the ring + :param mapping: dictionary of keys and values to be set in memcache + :param server_key: key to use in determining which server in the ring is used :param serialize: if True, value is serialized with JSON before sending - to memcache, or with pickle if configured to use - pickle instead of JSON (to avoid cache poisoning) - :param timeout: ttl for memcache + to memcache. + :param time: the time to live + :min_compress_len: minimum compress length, this parameter was added + to keep the signature compatible with + python-memcached interface. This implementation + ignores it """ - server_key = md5hash(server_key) - timeout = sanitize_timeout(timeout) - msg = '' - for key, value in mapping.iteritems(): + cmd = MemcacheCommand('set_multi', server_key) + timeout = sanitize_timeout(time) + msg = [] + for key, value in mapping.items(): key = md5hash(key) flags = 0 - if serialize and self._allow_pickle: - value = pickle.dumps(value, PICKLE_PROTOCOL) - flags |= PICKLE_FLAG - elif serialize: - value = json.dumps(value) + if serialize: + if isinstance(value, bytes): + value = value.decode('utf8') + value = json.dumps(value).encode('ascii') flags |= JSON_FLAG - msg += ('set %s %d %d %s noreply\r\n%s\r\n' % - (key, flags, timeout, len(value), value)) - for (server, fp, sock) in self._get_conns(server_key): + msg.append(set_msg(key, flags, timeout, value)) + for (server, fp, sock) in self._get_conns(cmd): + conn_start_time = tm.time() try: - sock.sendall(msg) - self._return_conn(server, fp, sock) - return - except Exception, e: - self._exception_occurred(server, e) + with Timeout(self._io_timeout): + sock.sendall(b''.join(msg)) + # Wait for the set to complete + for line in range(len(mapping)): + fp.readline() + self._return_conn(server, fp, sock) + return + except (Exception, Timeout) as e: + self._exception_occurred(server, e, cmd, conn_start_time, + sock=sock, fp=fp) + @memcached_timing_stats(sample_rate=TIMING_SAMPLE_RATE_HIGH) def get_multi(self, keys, server_key): """ Gets multiple values from memcache for the given keys. 
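# Illustrative sketch of the multi-key lookup described above: a single
# "get k1 k2 ...\r\n" round trip, with results re-ordered to match the request
# and misses returned as None (the dict stands in for the parsed VALUE
# records; keys and values are made up).
hash_keys = [b'k1', b'k2', b'k3']
request_line = b'get ' + b' '.join(hash_keys) + b'\r\n'
parsed_responses = {b'k1': 'alpha', b'k3': 'gamma'}   # k2 was a miss
values = [parsed_responses.get(k) for k in hash_keys]
print(values)   # ['alpha', None, 'gamma']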
:param keys: keys for values to be retrieved from memcache - :param servery_key: key to use in determining which server in the ring - is used + :param server_key: key to use in determining which server in the ring + is used :returns: list of values """ - server_key = md5hash(server_key) - keys = [md5hash(key) for key in keys] - for (server, fp, sock) in self._get_conns(server_key): + cmd = MemcacheCommand('get_multi', server_key) + hash_keys = [md5hash(key) for key in keys] + for (server, fp, sock) in self._get_conns(cmd): + conn_start_time = tm.time() try: - sock.sendall('get %s\r\n' % ' '.join(keys)) - line = fp.readline().strip().split() - responses = {} - while line[0].upper() != 'END': - if line[0].upper() == 'VALUE': - size = int(line[3]) - value = fp.read(size) - if int(line[2]) & PICKLE_FLAG: - if self._allow_unpickle: - value = pickle.loads(value) - else: - value = None - elif int(line[2]) & JSON_FLAG: - value = json.loads(value) - responses[line[1]] = value - fp.readline() + with Timeout(self._io_timeout): + sock.sendall(b'get ' + b' '.join(hash_keys) + b'\r\n') line = fp.readline().strip().split() - values = [] - for key in keys: - if key in responses: - values.append(responses[key]) - else: - values.append(None) - self._return_conn(server, fp, sock) - return values - except Exception, e: - self._exception_occurred(server, e) + responses = {} + while True: + if not line: + raise MemcacheConnectionError('incomplete read') + if line[0].upper() == b'END': + break + if line[0].upper() == b'VALUE': + size = int(line[3]) + value = fp.read(size) + if int(line[2]) & PICKLE_FLAG: + value = None + elif int(line[2]) & JSON_FLAG: + value = json.loads(value) + responses[line[1]] = value + fp.readline() + line = fp.readline().strip().split() + values = [] + for key in hash_keys: + if key in responses: + values.append(responses[key]) + else: + values.append(None) + self._return_conn(server, fp, sock) + return values + except (Exception, Timeout) as e: + self._exception_occurred(server, e, cmd, conn_start_time, + sock=sock, fp=fp) + + +def load_memcache(conf, logger): + """ + Build a MemcacheRing object from the given config. It will also use the + passed in logger. + + :param conf: a dict, the config options + :param logger: a logger + """ + memcache_servers = conf.get('memcache_servers') + try: + # Originally, while we documented using memcache_max_connections + # we only accepted max_connections + max_conns = int(conf.get('memcache_max_connections', + conf.get('max_connections', 0))) + except ValueError: + max_conns = 0 + + memcache_options = {} + if (not memcache_servers + or max_conns <= 0): + path = os.path.join(conf.get('swift_dir', '/etc/swift'), + 'memcache.conf') + memcache_conf = ConfigParser() + if memcache_conf.read(path): + # if memcache.conf exists we'll start with those base options + try: + memcache_options = dict(memcache_conf.items('memcache')) + except NoSectionError: + pass + + if not memcache_servers: + try: + memcache_servers = \ + memcache_conf.get('memcache', 'memcache_servers') + except (NoSectionError, NoOptionError): + pass + if max_conns <= 0: + try: + new_max_conns = \ + memcache_conf.get('memcache', + 'memcache_max_connections') + max_conns = int(new_max_conns) + except (NoSectionError, NoOptionError, ValueError): + pass + + # while memcache.conf options are the base for the memcache + # middleware, if you set the same option also in the filter + # section of the proxy config it is more specific. 
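# Illustrative sketch of the precedence described in the comment above, with
# made-up option values: options read from memcache.conf form the base, and
# anything also set in the proxy's filter section (passed in as ``conf``)
# takes precedence.
base_from_memcache_conf = {'memcache_servers': '10.0.0.1:11211',
                           'connect_timeout': '0.3'}
filter_section_conf = {'connect_timeout': '0.5'}

sketch_options = dict(base_from_memcache_conf)
sketch_options.update(filter_section_conf)
print(sketch_options['connect_timeout'])   # '0.5' -- the filter value wins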
+ memcache_options.update(conf) + connect_timeout = float(memcache_options.get( + 'connect_timeout', CONN_TIMEOUT)) + pool_timeout = float(memcache_options.get( + 'pool_timeout', POOL_TIMEOUT)) + tries = int(memcache_options.get('tries', TRY_COUNT)) + io_timeout = float(memcache_options.get('io_timeout', IO_TIMEOUT)) + if config_true_value(memcache_options.get('tls_enabled', 'false')): + tls_cafile = memcache_options.get('tls_cafile') + tls_certfile = memcache_options.get('tls_certfile') + tls_keyfile = memcache_options.get('tls_keyfile') + tls_context = ssl.create_default_context( + cafile=tls_cafile) + if tls_certfile: + tls_context.load_cert_chain(tls_certfile, tls_keyfile) + else: + tls_context = None + error_suppression_interval = float(memcache_options.get( + 'error_suppression_interval', ERROR_LIMIT_TIME)) + error_suppression_limit = float(memcache_options.get( + 'error_suppression_limit', ERROR_LIMIT_COUNT)) + item_size_warning_threshold = int(memcache_options.get( + 'item_size_warning_threshold', DEFAULT_ITEM_SIZE_WARNING_THRESHOLD)) + + if not memcache_servers: + memcache_servers = '127.0.0.1:11211' + if max_conns <= 0: + max_conns = 2 + + return MemcacheRing( + [s.strip() for s in memcache_servers.split(',') + if s.strip()], + connect_timeout=connect_timeout, + pool_timeout=pool_timeout, + tries=tries, + io_timeout=io_timeout, + max_conns=max_conns, + tls_context=tls_context, + logger=logger, + error_limit_count=error_suppression_limit, + error_limit_time=error_suppression_interval, + error_limit_duration=error_suppression_interval, + item_size_warning_threshold=item_size_warning_threshold) diff --git a/swift/common/middleware/__init__.py b/swift/common/middleware/__init__.py index e69de29bb2..c465a5caf3 100644 --- a/swift/common/middleware/__init__.py +++ b/swift/common/middleware/__init__.py @@ -0,0 +1,40 @@ +# Copyright (c) 2010-2017 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +import re +from swift.common.wsgi import WSGIContext + + +def app_property(name): + return property(lambda self: getattr(self.app, name)) + + +class RewriteContext(WSGIContext): + base_re = None + + def __init__(self, app, requested, rewritten): + super(RewriteContext, self).__init__(app) + self.requested = requested + self.rewritten_re = re.compile(self.base_re % re.escape(rewritten)) + + def handle_request(self, env, start_response): + resp_iter = self._app_call(env) + for i, (header, value) in enumerate(self._response_headers): + if header.lower() in ('location', 'content-location'): + self._response_headers[i] = (header, self.rewritten_re.sub( + r'\1%s\2' % self.requested, value)) + start_response(self._response_status, self._response_headers, + self._response_exc_info) + return resp_iter diff --git a/swift/common/middleware/account_quotas.py b/swift/common/middleware/account_quotas.py new file mode 100644 index 0000000000..ca8d1f0d7a --- /dev/null +++ b/swift/common/middleware/account_quotas.py @@ -0,0 +1,283 @@ +# Copyright (c) 2013 OpenStack Foundation. 
+# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +""" +``account_quotas`` is a middleware which blocks write requests (PUT, POST) if a +given account quota (in bytes) is exceeded while DELETE requests are still +allowed. + +``account_quotas`` uses the following metadata entries to store the account +quota + ++---------------------------------------------+-------------------------------+ +|Metadata | Use | ++=============================================+===============================+ +| X-Account-Meta-Quota-Bytes (obsoleted) | Maximum overall bytes stored | +| | in account across containers. | ++---------------------------------------------+-------------------------------+ +| X-Account-Quota-Bytes | Maximum overall bytes stored | +| | in account across containers. | ++---------------------------------------------+-------------------------------+ +| X-Account-Quota-Bytes-Policy- | Maximum overall bytes stored | +| | in account across containers, | +| | for the given policy. | ++---------------------------------------------+-------------------------------+ +| X-Account-Quota-Count | Maximum object count under | +| | account. | ++---------------------------------------------+-------------------------------+ +| X-Account-Quota-Count-Policy- | Maximum object count under | +| | account, for the given policy.| ++---------------------------------------------+-------------------------------+ + + +Write requests to those metadata entries are only permitted for resellers. +There is no overall byte or object count limit set if the corresponding +metadata entries are not set. + +Additionally, account quotas, of type quota-bytes or quota-count, may be set +for each storage policy, using metadata of the form ``x-account--\ +policy-``. Again, only resellers may update these metadata, and +there will be no limit for a particular policy if the corresponding metadata +is not set. + +.. note:: + Per-policy quotas need not sum to the overall account quota, and the sum of + all :ref:`container_quotas` for a given policy need not sum to the account's + policy quota. + +The ``account_quotas`` middleware should be added to the pipeline in your +``/etc/swift/proxy-server.conf`` file just after any auth middleware. +For example:: + + [pipeline:main] + pipeline = catch_errors cache tempauth account_quotas proxy-server + + [filter:account_quotas] + use = egg:swift#account_quotas + +To set the quota on an account:: + + swift -A http://127.0.0.1:8080/auth/v1.0 -U account:reseller -K secret \ +post -m quota-bytes:10000 + +Remove the quota:: + + swift -A http://127.0.0.1:8080/auth/v1.0 -U account:reseller -K secret \ +post -m quota-bytes: + +The same limitations apply for the account quotas as for the container quotas. + +For example, when uploading an object without a content-length header the proxy +server doesn't know the final size of the currently uploaded object and the +upload will be allowed if the current account size is within the quota. 
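# Illustrative sketch of the byte-quota check this middleware applies to an
# object PUT, with made-up numbers (the quota and current usage really come
# from account sysmeta and account stats): the request is rejected when the
# account's stored bytes plus the incoming content length exceed the quota.
def exceeds_quota(quota_bytes, account_bytes_used, content_length):
    if quota_bytes < 0:            # -1 means no quota configured
        return False
    return quota_bytes < account_bytes_used + content_length

print(exceeds_quota(10000, 9500, 400))   # False: 9900 fits
print(exceeds_quota(10000, 9500, 600))   # True: 10100 exceeds the quota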
+Due to the eventual consistency further uploads might be possible until the +account size has been updated. +""" + +from swift.common.swob import HTTPForbidden, HTTPBadRequest, \ + HTTPRequestEntityTooLarge, wsgify +from swift.common.registry import register_swift_info +from swift.common.storage_policy import POLICIES +from swift.proxy.controllers.base import get_account_info, get_container_info + + +class AccountQuotaMiddleware(object): + """Account quota middleware + + See above for a full description. + + """ + def __init__(self, app, *args, **kwargs): + self.app = app + + def quota_exceeded(self, request, body): + # request.environ['swift.authorize'](req) is delayed and not called + # immediately to support container acls. However, the middleware should + # still return immediately if any quota is exceeded. + resp = HTTPRequestEntityTooLarge(body=body) + if 'swift.authorize' in request.environ: + orig_authorize = request.environ['swift.authorize'] + + def reject_authorize(*args, **kwargs): + aresp = orig_authorize(*args, **kwargs) + if aresp: + return aresp + return resp + request.environ['swift.authorize'] = reject_authorize + return self.app + else: + return resp + + def validate_and_translate_quotas(self, request, quota_type): + new_quotas = {} + new_quotas[None] = request.headers.get( + 'X-Account-%s' % quota_type) + if request.headers.get( + 'X-Remove-Account-%s' % quota_type): + new_quotas[None] = '' # X-Remove dominates if both are present + + for policy in POLICIES: + tail = 'Account-%s-Policy-%s' % (quota_type, policy.name) + if request.headers.get('X-Remove-' + tail): + new_quotas[policy.idx] = '' + else: + quota = request.headers.pop('X-' + tail, None) + new_quotas[policy.idx] = quota + + if request.environ.get('reseller_request') is True: + if any(quota and not quota.isdigit() + for quota in new_quotas.values()): + raise HTTPBadRequest() + for idx, quota in new_quotas.items(): + if idx is None: + hdr = 'X-Account-Sysmeta-%s' % quota_type + else: + hdr = 'X-Account-Sysmeta-%s-Policy-%d' % (quota_type, idx) + request.headers[hdr] = quota + elif any(quota is not None for quota in new_quotas.values()): + # deny quota set for non-reseller + raise HTTPForbidden() + + def handle_account(self, request): + if request.method in ("POST", "PUT"): + # Support old meta format + for legacy_header in [ + 'X-Account-Meta-Quota-Bytes', + 'X-Remove-Account-Meta-Quota-Bytes', + ]: + new_header = legacy_header.replace('-Meta-', '-') + legacy_value = request.headers.get(legacy_header) + if legacy_value is not None and not \ + request.headers.get(new_header): + request.headers[new_header] = legacy_value + # account request, so we pay attention to the quotas + self.validate_and_translate_quotas(request, "Quota-Bytes") + self.validate_and_translate_quotas(request, "Quota-Count") + resp = request.get_response(self.app) + # Non-resellers can't update quotas, but they *can* see them + # Global quotas + postfixes = ('Quota-Bytes', 'Quota-Count') + for postfix in postfixes: + value = resp.headers.get('X-Account-Sysmeta-%s' % postfix) + if value: + resp.headers['X-Account-%s' % postfix] = value + + # Per policy quotas + for policy in POLICIES: + infixes = ('Quota-Bytes-Policy', 'Quota-Count-Policy') + for infix in infixes: + value = resp.headers.get('X-Account-Sysmeta-%s-%d' % ( + infix, policy.idx)) + if value: + resp.headers['X-Account-%s-%s' % ( + infix, policy.name)] = value + return resp + + @wsgify + def __call__(self, request): + + try: + ver, account, container, obj = request.split_path( + 2, 4, 
rest_with_last=True) + except ValueError: + return self.app + + if not container: + return self.handle_account(request) + # container or object request; even if the quota headers are set + # in the request, they're meaningless + + if not (request.method == "PUT" and obj): + return self.app + # OK, object PUT + + if request.environ.get('reseller_request') is True: + # but resellers aren't constrained by quotas :-) + return self.app + + # Object PUT request + content_length = (request.content_length or 0) + + account_info = get_account_info(request.environ, self.app, + swift_source='AQ') + if not account_info: + return self.app + + # Check for quota byte violation + try: + quota = int( + account_info["sysmeta"].get( + "quota-bytes", account_info["meta"].get("quota-bytes", -1) + ) + ) + except ValueError: + quota = -1 + if quota >= 0: + new_size = int(account_info['bytes']) + content_length + if quota < new_size: + return self.quota_exceeded(request, "Upload exceeds quota.") + + # Check for quota count violation + try: + quota = int(account_info['sysmeta'].get('quota-count', -1)) + except ValueError: + quota = -1 + if quota >= 0: + new_count = int(account_info['total_object_count']) + 1 + if quota < new_count: + return self.quota_exceeded(request, "Upload exceeds quota.") + + container_info = get_container_info(request.environ, self.app, + swift_source='AQ') + if not container_info: + return self.app + policy_idx = container_info['storage_policy'] + + # Check quota-byte per policy + sysmeta_key = 'quota-bytes-policy-%s' % policy_idx + try: + policy_quota = int(account_info['sysmeta'].get(sysmeta_key, -1)) + except ValueError: + policy_quota = -1 + if policy_quota >= 0: + policy_stats = account_info['storage_policies'].get(policy_idx, {}) + new_size = int(policy_stats.get('bytes', 0)) + content_length + if policy_quota < new_size: + return self.quota_exceeded( + request, "Upload exceeds policy quota.") + + # Check quota-count per policy + sysmeta_key = 'quota-count-policy-%s' % policy_idx + try: + policy_quota = int(account_info['sysmeta'].get(sysmeta_key, -1)) + except ValueError: + policy_quota = -1 + if policy_quota >= 0: + policy_stats = account_info['storage_policies'].get(policy_idx, {}) + new_size = int(policy_stats.get('object_count', 0)) + 1 + if policy_quota < new_size: + return self.quota_exceeded( + request, "Upload exceeds policy quota.") + + return self.app + + +def filter_factory(global_conf, **local_conf): + """Returns a WSGI filter app for use with paste.deploy.""" + register_swift_info('account_quotas') + + def account_quota_filter(app): + return AccountQuotaMiddleware(app) + return account_quota_filter diff --git a/swift/common/middleware/acl.py b/swift/common/middleware/acl.py index b542493fff..a8c0e04bce 100644 --- a/swift/common/middleware/acl.py +++ b/swift/common/middleware/acl.py @@ -1,4 +1,4 @@ -# Copyright (c) 2010-2012 OpenStack, LLC. +# Copyright (c) 2010-2012 OpenStack Foundation # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. @@ -13,7 +13,8 @@ # See the License for the specific language governing permissions and # limitations under the License. 
-from swift.common.utils import urlparse +import json +from urllib.parse import unquote, urlparse def clean_acl(name, value): @@ -89,35 +90,98 @@ def clean_acl(name, value): values = [] for raw_value in value.split(','): raw_value = raw_value.strip() - if raw_value: - if ':' not in raw_value: - values.append(raw_value) - else: - first, second = (v.strip() for v in raw_value.split(':', 1)) - if not first or first[0] != '.': - values.append(raw_value) - elif first in ('.r', '.ref', '.referer', '.referrer'): - if 'write' in name: - raise ValueError('Referrers not allowed in write ACL: ' - '%s' % repr(raw_value)) - negate = False - if second and second[0] == '-': - negate = True - second = second[1:].strip() - if second and second != '*' and second[0] == '*': - second = second[1:].strip() - if not second or second == '.': - raise ValueError('No host/domain value after referrer ' - 'designation in ACL: %s' % - repr(raw_value)) - values.append('.r:%s%s' % (negate and '-' or '', second)) - else: - raise ValueError('Unknown designator %s in ACL: %s' % - (repr(first), repr(raw_value))) + if not raw_value: + continue + if ':' not in raw_value: + values.append(raw_value) + continue + first, second = (v.strip() for v in raw_value.split(':', 1)) + if not first or not first.startswith('.'): + values.append(raw_value) + elif first in ('.r', '.ref', '.referer', '.referrer'): + if 'write' in name: + raise ValueError('Referrers not allowed in write ACL: ' + '%s' % repr(raw_value)) + negate = False + if second and second.startswith('-'): + negate = True + second = second[1:].strip() + if second and second != '*' and second.startswith('*'): + second = second[1:].strip() + if not second or second == '.': + raise ValueError('No host/domain value after referrer ' + 'designation in ACL: %s' % repr(raw_value)) + values.append('.r:%s%s' % ('-' if negate else '', second)) + else: + raise ValueError('Unknown designator %s in ACL: %s' % + (repr(first), repr(raw_value))) return ','.join(values) -def parse_acl(acl_string): +def format_acl_v1(groups=None, referrers=None, header_name=None): + """ + Returns a standard Swift ACL string for the given inputs. + + Caller is responsible for ensuring that :referrers: parameter is only given + if the ACL is being generated for X-Container-Read. (X-Container-Write + and the account ACL headers don't support referrers.) + + :param groups: a list of groups (and/or members in most auth systems) to + grant access + :param referrers: a list of referrer designations (without the leading .r:) + :param header_name: (optional) header name of the ACL we're preparing, for + clean_acl; if None, returned ACL won't be cleaned + :returns: a Swift ACL string for use in X-Container-{Read,Write}, + X-Account-Access-Control, etc. + """ + groups, referrers = groups or [], referrers or [] + referrers = ['.r:%s' % r for r in referrers] + result = ','.join(groups + referrers) + return (clean_acl(header_name, result) if header_name else result) + + +def format_acl_v2(acl_dict): + r""" + Returns a version-2 Swift ACL JSON string. + + HTTP headers for Version 2 ACLs have the following form: + Header-Name: {"arbitrary":"json","encoded":"string"} + + JSON will be forced ASCII (containing six-char \uNNNN sequences rather + than UTF-8; UTF-8 is valid JSON but clients vary in their support for + UTF-8 headers), and without extraneous whitespace. 
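# Illustrative example of a version-2 account ACL serialized as described
# above: compact, ASCII-only JSON with sorted keys (member names made up).
import json

acl_dict = {'admin': ['acct:adm'],
            'read-write': [],
            'read-only': ['acct:viewer']}
header_value = json.dumps(acl_dict, ensure_ascii=True,
                          separators=(',', ':'), sort_keys=True)
print(header_value)
# {"admin":["acct:adm"],"read-only":["acct:viewer"],"read-write":[]}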
+ + Advantages over V1: forward compatibility (new keys don't cause parsing + exceptions); Unicode support; no reserved words (you can have a user + named .rlistings if you want). + + :param acl_dict: dict of arbitrary data to put in the ACL; see specific + auth systems such as tempauth for supported values + :returns: a JSON string which encodes the ACL + """ + return json.dumps(acl_dict, ensure_ascii=True, separators=(',', ':'), + sort_keys=True) + + +def format_acl(version=1, **kwargs): + """ + Compatibility wrapper to help migrate ACL syntax from version 1 to 2. + Delegates to the appropriate version-specific format_acl method, defaulting + to version 1 for backward compatibility. + + :param kwargs: keyword args appropriate for the selected ACL syntax version + (see :func:`format_acl_v1` or :func:`format_acl_v2`) + """ + if version == 1: + return format_acl_v1( + groups=kwargs.get('groups'), referrers=kwargs.get('referrers'), + header_name=kwargs.get('header_name')) + elif version == 2: + return format_acl_v2(kwargs.get('acl_dict')) + raise ValueError("Invalid ACL version: %r" % version) + + +def parse_acl_v1(acl_string): """ Parses a standard Swift ACL string into a referrers list and groups list. @@ -135,10 +199,53 @@ def parse_acl(acl_string): if value.startswith('.r:'): referrers.append(value[len('.r:'):]) else: - groups.append(value) + groups.append(unquote(value)) return referrers, groups +def parse_acl_v2(data): + """ + Parses a version-2 Swift ACL string and returns a dict of ACL info. + + :param data: string containing the ACL data in JSON format + :returns: A dict (possibly empty) containing ACL info, e.g.: + {"groups": [...], "referrers": [...]} + :returns: None if data is None, is not valid JSON or does not parse + as a dict + :returns: empty dictionary if data is an empty string + """ + if data is None: + return None + if data == '': + return {} + try: + result = json.loads(data) + return (result if type(result) is dict else None) + except ValueError: + return None + + +def parse_acl(*args, **kwargs): + """ + Compatibility wrapper to help migrate ACL syntax from version 1 to 2. + Delegates to the appropriate version-specific parse_acl method, attempting + to determine the version from the types of args/kwargs. + + :param args: positional args for the selected ACL syntax version + :param kwargs: keyword args for the selected ACL syntax version + (see :func:`parse_acl_v1` or :func:`parse_acl_v2`) + :returns: the return value of :func:`parse_acl_v1` or :func:`parse_acl_v2` + """ + version = kwargs.pop('version', None) + if version in (1, None): + return parse_acl_v1(*args) + elif version == 2: + return parse_acl_v2(*args, **kwargs) + else: + raise ValueError('Unknown ACL version: parse_acl(%r, %r)' % + (args, kwargs)) + + def referrer_allowed(referrer, referrer_acl): """ Returns True if the referrer should be allowed based on the referrer_acl @@ -155,12 +262,39 @@ def referrer_allowed(referrer, referrer_acl): if referrer_acl: rhost = urlparse(referrer or '').hostname or 'unknown' for mhost in referrer_acl: - if mhost[0] == '-': + if mhost.startswith('-'): mhost = mhost[1:] - if mhost == rhost or (mhost[0] == '.' and + if mhost == rhost or (mhost.startswith('.') and rhost.endswith(mhost)): allow = False elif mhost == '*' or mhost == rhost or \ - (mhost[0] == '.' 
and rhost.endswith(mhost)): + (mhost.startswith('.') and rhost.endswith(mhost)): allow = True return allow + + +def acls_from_account_info(info): + """ + Extract the account ACLs from the given account_info, and return the ACLs. + + :param info: a dict of the form returned by get_account_info + :returns: None (no ACL system metadata is set), or a dict of the form:: + {'admin': [...], 'read-write': [...], 'read-only': [...]} + + :raises ValueError: on a syntactically invalid header + """ + acl = parse_acl( + version=2, data=info.get('sysmeta', {}).get('core-access-control')) + if acl is None: + return None + admin_members = acl.get('admin', []) + readwrite_members = acl.get('read-write', []) + readonly_members = acl.get('read-only', []) + if not any((admin_members, readwrite_members, readonly_members)): + return None + + return { + 'admin': admin_members, + 'read-write': readwrite_members, + 'read-only': readonly_members, + } diff --git a/swift/common/middleware/backend_ratelimit.py b/swift/common/middleware/backend_ratelimit.py new file mode 100644 index 0000000000..696d926ae8 --- /dev/null +++ b/swift/common/middleware/backend_ratelimit.py @@ -0,0 +1,230 @@ +# Copyright (c) 2022 NVIDIA +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. +import os +import time + +from swift.common.request_helpers import split_and_validate_path +from swift.common.swob import Request, HTTPTooManyBackendRequests, \ + HTTPException +from swift.common.utils import get_logger, non_negative_float, \ + EventletRateLimiter, readconf + +RATE_LIMITED_METHODS = ('GET', 'HEAD', 'PUT', 'POST', 'DELETE', 'UPDATE', + 'REPLICATE') +BACKEND_RATELIMIT_CONFIG_SECTION = 'backend_ratelimit' +DEFAULT_BACKEND_RATELIMIT_CONF_FILE = 'backend-ratelimit.conf' +DEFAULT_CONFIG_RELOAD_INTERVAL = 60.0 +DEFAULT_REQUESTS_PER_DEVICE_PER_SECOND = 0.0 +DEFAULT_REQUESTS_PER_DEVICE_RATE_BUFFER = 1.0 + + +class BackendRateLimitMiddleware(object): + """ + Backend rate-limiting middleware. + + Rate-limits requests to backend storage node devices. Each (device, request + method) combination is independently rate-limited. All requests with a + 'GET', 'HEAD', 'PUT', 'POST', 'DELETE', 'UPDATE' or 'REPLICATE' method are + rate limited on a per-device basis by both a method-specific rate and an + overall device rate limit. + + If a request would cause the rate-limit to be exceeded for the method + and/or device then a response with a 529 status code is returned. + """ + def __init__(self, app, filter_conf, logger=None): + self.app = app + self.filter_conf = filter_conf + self.logger = logger or get_logger(self.filter_conf, + log_route='backend_ratelimit') + self.requests_per_device_rate_buffer = \ + DEFAULT_REQUESTS_PER_DEVICE_RATE_BUFFER + # map (device, method) -> rate + self.requests_per_device_per_second = {} + # map (device, method) -> RateLimiter, populated on-demand + self.rate_limiters = {} + + # some config options are *only* read from filter conf at startup... 
+ default_conf_path = os.path.join( + self.filter_conf.get('swift_dir', '/etc/swift'), + DEFAULT_BACKEND_RATELIMIT_CONF_FILE) + try: + self.conf_path = self.filter_conf['backend_ratelimit_conf_path'] + self.is_config_file_expected = True + except KeyError: + self.conf_path = default_conf_path + self.is_config_file_expected = False + self.config_reload_interval = non_negative_float( + filter_conf.get('config_reload_interval', + DEFAULT_CONFIG_RELOAD_INTERVAL)) + + # other conf options are read from filter section at startup but may + # also be overridden by options in a separate config file... + self._last_config_reload_attempt = time.time() + self._apply_config(self.filter_conf) + self._load_config_file() + + def _refresh_ratelimiters(self): + # note: if we ever wanted to prune the ratelimiters (in case devices + # have been removed) we could inspect each ratelimiter's running_time + # and remove those with very old running_time + for (dev, method), rl in self.rate_limiters.items(): + rl.set_max_rate(self.requests_per_device_per_second[method]) + rl.set_rate_buffer(self.requests_per_device_rate_buffer) + + def _apply_config(self, conf): + modified = False + reqs_per_device_rate_buffer = non_negative_float( + conf.get('requests_per_device_rate_buffer', + DEFAULT_REQUESTS_PER_DEVICE_RATE_BUFFER)) + + # note: 'None' key holds the aggregate per-device limit for all methods + reqs_per_device_per_second = {None: non_negative_float( + conf.get('requests_per_device_per_second', 0.0))} + for method in RATE_LIMITED_METHODS: + val = non_negative_float( + conf.get('%s_requests_per_device_per_second' + % method.lower(), 0.0)) + reqs_per_device_per_second[method] = val + + if reqs_per_device_rate_buffer != self.requests_per_device_rate_buffer: + self.requests_per_device_rate_buffer = reqs_per_device_rate_buffer + modified = True + if reqs_per_device_per_second != self.requests_per_device_per_second: + self.requests_per_device_per_second = reqs_per_device_per_second + self.is_any_rate_limit_configured = any( + self.requests_per_device_per_second.values()) + modified = True + if modified: + self._refresh_ratelimiters() + return modified + + def _load_config_file(self): + # If conf file can be read then apply its options to the filter conf + # options, discarding *all* options previously loaded from the conf + # file i.e. options deleted from the conf file will revert to the + # filter conf value or default value. If the conf file cannot be read + # or is invalid, then the current config is left unchanged. 
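# Illustrative sketch of the reload semantics described in the comment above,
# with made-up options: each reload starts from a copy of the original filter
# conf and layers the current conf-file contents on top, so an option deleted
# from the conf file reverts to its filter-conf (or default) value.
filter_conf = {'requests_per_device_per_second': '50'}

def sketch_reload(options_from_file):
    new_conf = dict(filter_conf)      # never mutate the startup filter conf
    new_conf.update(options_from_file)
    return new_conf

print(sketch_reload({'requests_per_device_per_second': '25'}))  # file wins
print(sketch_reload({}))   # option removed from file -> back to '50'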
+ try: + new_conf = dict(self.filter_conf) # filter_conf not current conf + new_conf.update( + readconf(self.conf_path, BACKEND_RATELIMIT_CONFIG_SECTION)) + modified = self._apply_config(new_conf) + if modified: + self.logger.info('Loaded config file %s, config changed', + self.conf_path) + elif not self.is_config_file_expected: + self.logger.info('Loaded new config file %s, config unchanged', + self.conf_path) + else: + self.logger.debug( + 'Loaded existing config file %s, config unchanged', + self.conf_path) + self.is_config_file_expected = True + except IOError as err: + if self.is_config_file_expected: + self.logger.warning( + 'Failed to load config file, config unchanged: %s', err) + self.is_config_file_expected = False + except ValueError as err: + # ...but if it exists it should be valid + self.logger.warning('Invalid config file %s, config unchanged: %s', + self.conf_path, err) + + def _maybe_reload_config(self): + if self.config_reload_interval: + now = time.time() + if (now - self._last_config_reload_attempt + >= self.config_reload_interval): + try: + self._load_config_file() + except Exception: # noqa + self.logger.exception('Error reloading config file') + finally: + # always reset last loaded time to avoid re-try storm + self._last_config_reload_attempt = now + + def _get_ratelimiter(self, device, method=None): + """ + Get a rate limiter for the (device, method) combination. If a rate + limiter does not yet exist for the given (device, method) combination + then it is created and added to the map of rate limiters. + + :param: the device. + :method: the request method; if None then the aggregate rate limiter + for all requests to the device is returned. + :returns: an instance of ``EventletRateLimiter``. + """ + try: + rl = self.rate_limiters[(device, method)] + except KeyError: + rl = EventletRateLimiter( + max_rate=self.requests_per_device_per_second[method], + rate_buffer=self.requests_per_device_rate_buffer, + running_time=time.time(), + burst_after_idle=True) + self.rate_limiters[(device, method)] = rl + return rl + + def _is_allowed(self, device, method): + """ + Evaluate backend rate-limiting policies for the incoming request. + + A request is allowed when neither the per-(device, method) rate-limit + nor the per-device rate-limit has been reached. + + Note: a request will be disallowed if the aggregate per-device + rate-limit has been reached, even if the per-(device, method) + rate-limit has not been reached for the request's method. + + :param: the device. + :method: the request method. + :returns: boolean, is_allowed. + """ + return (self._get_ratelimiter(device, None).is_allowed() + and self._get_ratelimiter(device, method).is_allowed()) + + def __call__(self, env, start_response): + """ + WSGI entry point. + + :param env: WSGI environment dictionary + :param start_response: WSGI callable + """ + self._maybe_reload_config() + req = Request(env) + handler = self.app + if (self.is_any_rate_limit_configured + and req.method in RATE_LIMITED_METHODS): + try: + device, partition, _ = split_and_validate_path(req, 1, 3, True) + int(partition) # check it's a valid partition + except (ValueError, HTTPException): + # request may not have device/partition e.g. 
a healthcheck req + pass + else: + if not self._is_allowed(device, req.method): + self.logger.increment('backend.ratelimit') + handler = HTTPTooManyBackendRequests() + return handler(env, start_response) + + +def filter_factory(global_conf, **local_conf): + conf = global_conf.copy() + conf.update(local_conf) + + def backend_ratelimit_filter(app): + return BackendRateLimitMiddleware(app, conf) + + return backend_ratelimit_filter diff --git a/swift/common/middleware/bulk.py b/swift/common/middleware/bulk.py new file mode 100644 index 0000000000..cf26c7ef5a --- /dev/null +++ b/swift/common/middleware/bulk.py @@ -0,0 +1,728 @@ +# Copyright (c) 2013 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +""" +Middleware that will perform many operations on a single request. + +--------------- +Extract Archive +--------------- + +Expand tar files into a Swift account. Request must be a PUT with the +query parameter ``?extract-archive=format`` specifying the format of archive +file. Accepted formats are tar, tar.gz, and tar.bz2. + +For a PUT to the following url:: + + /v1/AUTH_Account/$UPLOAD_PATH?extract-archive=tar.gz + +UPLOAD_PATH is where the files will be expanded to. UPLOAD_PATH can be a +container, a pseudo-directory within a container, or an empty string. The +destination of a file in the archive will be built as follows:: + + /v1/AUTH_Account/$UPLOAD_PATH/$FILE_PATH + +Where FILE_PATH is the file name from the listing in the tar file. + +If the UPLOAD_PATH is an empty string, containers will be auto created +accordingly and files in the tar that would not map to any container (files +in the base directory) will be ignored. + +Only regular files will be uploaded. Empty directories, symlinks, etc will +not be uploaded. + +------------ +Content Type +------------ + +If the content-type header is set in the extract-archive call, Swift will +assign that content-type to all the underlying files. The bulk middleware +will extract the archive file and send the internal files using PUT +operations using the same headers from the original request +(e.g. auth-tokens, content-Type, etc.). Notice that any middleware call +that follows the bulk middleware does not know if this was a bulk request +or if these were individual requests sent by the user. + +In order to make Swift detect the content-type for the files based on the +file extension, the content-type in the extract-archive call should not be +set. Alternatively, it is possible to explicitly tell Swift to detect the +content type using this header:: + + X-Detect-Content-Type: true + +For example:: + + curl -X PUT http://127.0.0.1/v1/AUTH_acc/cont/$?extract-archive=tar + -T backup.tar + -H "Content-Type: application/x-tar" + -H "X-Auth-Token: xxx" + -H "X-Detect-Content-Type: true" + +------------------ +Assigning Metadata +------------------ + +The tar file format (1) allows for UTF-8 key/value pairs to be associated +with each file in an archive. If a file has extended attributes, then tar +will store those as key/value pairs. 
The bulk middleware can read those +extended attributes and convert them to Swift object metadata. Attributes +starting with "user.meta" are converted to object metadata, and +"user.mime_type" is converted to Content-Type. + +For example:: + + setfattr -n user.mime_type -v "application/python-setup" setup.py + setfattr -n user.meta.lunch -v "burger and fries" setup.py + setfattr -n user.meta.dinner -v "baked ziti" setup.py + setfattr -n user.stuff -v "whee" setup.py + +Will get translated to headers:: + + Content-Type: application/python-setup + X-Object-Meta-Lunch: burger and fries + X-Object-Meta-Dinner: baked ziti + +The bulk middleware will handle xattrs stored by both GNU and BSD tar (2). +Only xattrs ``user.mime_type`` and ``user.meta.*`` are processed. Other +attributes are ignored. + +In addition to the extended attributes, the object metadata and the +x-delete-at/x-delete-after headers set in the request are also assigned to the +extracted objects. + +Notes: + +(1) The POSIX 1003.1-2001 (pax) format. The default format on GNU tar +1.27.1 or later. + +(2) Even with pax-format tarballs, different encoders store xattrs slightly +differently; for example, GNU tar stores the xattr "user.userattribute" as +pax header "SCHILY.xattr.user.userattribute", while BSD tar (which uses +libarchive) stores it as "LIBARCHIVE.xattr.user.userattribute". + +-------- +Response +-------- + +The response from bulk operations functions differently from other Swift +responses. This is because a short request body sent from the client could +result in many operations on the proxy server and precautions need to be +made to prevent the request from timing out due to lack of activity. To +this end, the client will always receive a 200 OK response, regardless of +the actual success of the call. The body of the response must be parsed to +determine the actual success of the operation. In addition to this the +client may receive zero or more whitespace characters prepended to the +actual response body while the proxy server is completing the request. + +The format of the response body defaults to text/plain but can be either +json or xml depending on the ``Accept`` header. Acceptable formats are +``text/plain``, ``application/json``, ``application/xml``, and ``text/xml``. +An example body is as follows:: + + {"Response Status": "201 Created", + "Response Body": "", + "Errors": [], + "Number Files Created": 10} + +If all valid files were uploaded successfully the Response Status will be +201 Created. If any files failed to be created the response code +corresponds to the subrequest's error. Possible codes are 400, 401, 502 (on +server errors), etc. In both cases the response body will specify the +number of files successfully uploaded and a list of the files that failed. + +There are proxy logs created for each file (which becomes a subrequest) in +the tar. The subrequest's proxy log will have a swift.source set to "EA" +the log's content length will reflect the unzipped size of the file. If +double proxy-logging is used the leftmost logger will not have a +swift.source set and the content length will reflect the size of the +payload sent to the proxy (the unexpanded size of the tar.gz). + +----------- +Bulk Delete +----------- + +Will delete multiple objects or containers from their account with a +single request. Responds to POST requests with query parameter +``?bulk-delete`` set. The request url is your storage url. The Content-Type +should be set to ``text/plain``. 
The body of the POST request will be a +newline separated list of url encoded objects to delete. You can delete +10,000 (configurable) objects per request. The objects specified in the +POST request body must be URL encoded and in the form:: + + /container_name/obj_name + +or for a container (which must be empty at time of delete):: + + /container_name + +The response is similar to extract archive as in every response will be a +200 OK and you must parse the response body for actual results. An example +response is:: + + {"Number Not Found": 0, + "Response Status": "200 OK", + "Response Body": "", + "Errors": [], + "Number Deleted": 6} + +If all items were successfully deleted (or did not exist), the Response +Status will be 200 OK. If any failed to delete, the response code +corresponds to the subrequest's error. Possible codes are 400, 401, 502 (on +server errors), etc. In all cases the response body will specify the number +of items successfully deleted, not found, and a list of those that failed. +The return body will be formatted in the way specified in the request's +``Accept`` header. Acceptable formats are ``text/plain``, ``application/json``, +``application/xml``, and ``text/xml``. + +There are proxy logs created for each object or container (which becomes a +subrequest) that is deleted. The subrequest's proxy log will have a +swift.source set to "BD" the log's content length of 0. If double +proxy-logging is used the leftmost logger will not have a +swift.source set and the content length will reflect the size of the +payload sent to the proxy (the list of objects/containers to be deleted). +""" + +from swift.common.request_helpers import get_heartbeat_response_body +import tarfile +from time import time +from eventlet import sleep +import zlib +from swift.common.swob import Request, HTTPBadGateway, \ + HTTPCreated, HTTPBadRequest, HTTPNotFound, HTTPUnauthorized, HTTPOk, \ + HTTPPreconditionFailed, HTTPRequestEntityTooLarge, HTTPNotAcceptable, \ + HTTPLengthRequired, HTTPException, HTTPServerError, wsgify, \ + bytes_to_wsgi, str_to_wsgi, wsgi_unquote, wsgi_quote, wsgi_to_str +from swift.common.utils import get_logger, StreamingPile +from swift.common.registry import register_swift_info +from swift.common import constraints +from swift.common.http import HTTP_UNAUTHORIZED, HTTP_NOT_FOUND, HTTP_CONFLICT +from swift.common.request_helpers import is_user_meta +from swift.common.wsgi import make_subrequest + + +class CreateContainerError(Exception): + def __init__(self, msg, status_int, status): + self.status_int = status_int + self.status = status + super(CreateContainerError, self).__init__(msg) + + +ACCEPTABLE_FORMATS = ['text/plain', 'application/json', 'application/xml', + 'text/xml'] + + +def pax_key_to_swift_header(pax_key): + if (pax_key == u"SCHILY.xattr.user.mime_type" or + pax_key == u"LIBARCHIVE.xattr.user.mime_type"): + return "Content-Type" + elif pax_key.startswith(u"SCHILY.xattr.user.meta."): + useful_part = pax_key[len(u"SCHILY.xattr.user.meta."):] + return str_to_wsgi("X-Object-Meta-" + useful_part) + elif pax_key.startswith(u"LIBARCHIVE.xattr.user.meta."): + useful_part = pax_key[len(u"LIBARCHIVE.xattr.user.meta."):] + return str_to_wsgi("X-Object-Meta-" + useful_part) + else: + # You can get things like atime/mtime/ctime or filesystem ACLs in + # pax headers; those aren't really user metadata. The same goes for + # other, non-user metadata. 
+ return None + + +class Bulk(object): + + def __init__(self, app, conf, max_containers_per_extraction=10000, + max_failed_extractions=1000, max_deletes_per_request=10000, + max_failed_deletes=1000, yield_frequency=10, + delete_concurrency=2, retry_count=0, retry_interval=1.5, + logger=None): + self.app = app + self.logger = logger or get_logger(conf, log_route='bulk') + self.max_containers = max_containers_per_extraction + self.max_failed_extractions = max_failed_extractions + self.max_failed_deletes = max_failed_deletes + self.max_deletes_per_request = max_deletes_per_request + self.yield_frequency = yield_frequency + self.delete_concurrency = min(1000, max(1, delete_concurrency)) + self.retry_count = retry_count + self.retry_interval = retry_interval + self.max_path_length = constraints.MAX_OBJECT_NAME_LENGTH \ + + constraints.MAX_CONTAINER_NAME_LENGTH + 2 + + def create_container(self, req, container_path): + """ + Checks if the container exists and if not try to create it. + :params container_path: an unquoted path to a container to be created + :returns: True if created container, False if container exists + :raises CreateContainerError: when unable to create container + """ + head_cont_req = make_subrequest( + req.environ, method='HEAD', path=wsgi_quote(container_path), + headers={'X-Auth-Token': req.headers.get('X-Auth-Token')}, + swift_source='EA') + resp = head_cont_req.get_response(self.app) + if resp.is_success: + return False + if resp.status_int == HTTP_NOT_FOUND: + create_cont_req = make_subrequest( + req.environ, method='PUT', path=wsgi_quote(container_path), + headers={'X-Auth-Token': req.headers.get('X-Auth-Token')}, + swift_source='EA') + resp = create_cont_req.get_response(self.app) + if resp.is_success: + return True + raise CreateContainerError( + "Create Container Failed: " + container_path, + resp.status_int, resp.status) + + def get_objs_to_delete(self, req): + """ + Will populate objs_to_delete with data from request input. + :params req: a Swob request + :returns: a list of the contents of req.body when separated by newline. + :raises HTTPException: on failures + """ + line = b'' + data_remaining = True + objs_to_delete = [] + if req.content_length is None and \ + req.headers.get('transfer-encoding', '').lower() != 'chunked': + raise HTTPLengthRequired(request=req) + + while data_remaining: + if b'\n' in line: + obj_to_delete, line = line.split(b'\n', 1) + # yeah, all this chaining is pretty terrible... 
+ # but it gets even worse trying to use UTF-8 and + # errors='surrogateescape' when dealing with terrible + # input like b'\xe2%98\x83' + obj_to_delete = wsgi_to_str(wsgi_unquote( + bytes_to_wsgi(obj_to_delete.strip()))) + objs_to_delete.append({'name': obj_to_delete}) + else: + data = req.body_file.read(self.max_path_length) + if data: + line += data + else: + data_remaining = False + obj_to_delete = wsgi_to_str(wsgi_unquote( + bytes_to_wsgi(line.strip()))) + if obj_to_delete: + objs_to_delete.append({'name': obj_to_delete}) + if len(objs_to_delete) > self.max_deletes_per_request: + raise HTTPRequestEntityTooLarge( + 'Maximum Bulk Deletes: %d per request' % + self.max_deletes_per_request) + if len(line) > self.max_path_length * 2: + raise HTTPBadRequest('Invalid File Name') + return objs_to_delete + + def handle_delete_iter(self, req, objs_to_delete=None, + user_agent='BulkDelete', swift_source='BD', + out_content_type='text/plain'): + """ + A generator that can be assigned to a swob Response's app_iter which, + when iterated over, will delete the objects specified in request body. + Will occasionally yield whitespace while request is being processed. + When the request is completed will yield a response body that can be + parsed to determine success. See above documentation for details. + + :params req: a swob Request + :params objs_to_delete: a list of dictionaries that specifies the + (native string) objects to be deleted. If None, uses + self.get_objs_to_delete to query request. + """ + last_yield = time() + if out_content_type and out_content_type.endswith('/xml'): + to_yield = b'\n' + else: + to_yield = b' ' + separator = b'' + failed_files = [] + resp_dict = {'Response Status': HTTPOk().status, + 'Response Body': '', + 'Number Deleted': 0, + 'Number Not Found': 0} + req.environ['eventlet.minimum_write_chunk_size'] = 0 + try: + if not out_content_type: + raise HTTPNotAcceptable(request=req) + + try: + vrs, account, _junk = req.split_path(2, 3, True) + except ValueError: + raise HTTPNotFound(request=req) + vrs = wsgi_to_str(vrs) + account = wsgi_to_str(account) + + incoming_format = req.headers.get('Content-Type') + if incoming_format and \ + not incoming_format.startswith('text/plain'): + # For now only accept newline separated object names + raise HTTPNotAcceptable(request=req) + + if objs_to_delete is None: + objs_to_delete = self.get_objs_to_delete(req) + failed_file_response = {'type': HTTPBadRequest} + + def delete_filter(predicate, objs_to_delete): + for obj_to_delete in objs_to_delete: + obj_name = obj_to_delete['name'] + if not obj_name: + continue + if not predicate(obj_name): + continue + if obj_to_delete.get('error'): + if obj_to_delete['error']['code'] == HTTP_NOT_FOUND: + resp_dict['Number Not Found'] += 1 + else: + failed_files.append([ + wsgi_quote(str_to_wsgi(obj_name)), + obj_to_delete['error']['message']]) + continue + delete_path = '/'.join(['', vrs, account, + obj_name.lstrip('/')]) + if not constraints.check_utf8(delete_path): + failed_files.append([wsgi_quote(str_to_wsgi(obj_name)), + HTTPPreconditionFailed().status]) + continue + yield (obj_name, delete_path, + obj_to_delete.get('version_id')) + + def objs_then_containers(objs_to_delete): + # process all objects first + yield delete_filter(lambda name: '/' in name.strip('/'), + objs_to_delete) + # followed by containers + yield delete_filter(lambda name: '/' not in name.strip('/'), + objs_to_delete) + + def do_delete(obj_name, delete_path, version_id): + delete_obj_req = make_subrequest( + req.environ, 
method='DELETE', + path=wsgi_quote(str_to_wsgi(delete_path)), + headers={'X-Auth-Token': req.headers.get('X-Auth-Token')}, + body='', agent='%(orig)s ' + user_agent, + swift_source=swift_source) + if version_id is None: + delete_obj_req.params = {} + else: + delete_obj_req.params = {'version-id': version_id} + return (delete_obj_req.get_response(self.app), obj_name, 0) + + with StreamingPile(self.delete_concurrency) as pile: + for names_to_delete in objs_then_containers(objs_to_delete): + for resp, obj_name, retry in pile.asyncstarmap( + do_delete, names_to_delete): + if last_yield + self.yield_frequency < time(): + last_yield = time() + yield to_yield + to_yield, separator = b' ', b'\r\n\r\n' + self._process_delete(resp, pile, obj_name, + resp_dict, failed_files, + failed_file_response, retry) + if len(failed_files) >= self.max_failed_deletes: + # Abort, but drain off the in-progress deletes + for resp, obj_name, retry in pile: + if last_yield + self.yield_frequency < time(): + last_yield = time() + yield to_yield + to_yield, separator = b' ', b'\r\n\r\n' + # Don't pass in the pile, as we shouldn't retry + self._process_delete( + resp, None, obj_name, resp_dict, + failed_files, failed_file_response, retry) + msg = 'Max delete failures exceeded' + raise HTTPBadRequest(msg) + + if failed_files: + resp_dict['Response Status'] = \ + failed_file_response['type']().status + elif not (resp_dict['Number Deleted'] or + resp_dict['Number Not Found']): + resp_dict['Response Status'] = HTTPBadRequest().status + resp_dict['Response Body'] = 'Invalid bulk delete.' + + except HTTPException as err: + resp_dict['Response Status'] = err.status + resp_dict['Response Body'] = err.body.decode('utf-8') + except Exception: + self.logger.exception('Error in bulk delete.') + resp_dict['Response Status'] = HTTPServerError().status + + yield separator + get_heartbeat_response_body(out_content_type, + resp_dict, failed_files, + 'delete') + + def handle_extract_iter(self, req, compress_type, + out_content_type='text/plain'): + """ + A generator that can be assigned to a swob Response's app_iter which, + when iterated over, will extract and PUT the objects pulled from the + request body. Will occasionally yield whitespace while request is being + processed. When the request is completed will yield a response body + that can be parsed to determine success. See above documentation for + details. + + :params req: a swob Request + :params compress_type: specifying the compression type of the tar. 
+ Accepts '', 'gz', or 'bz2' + """ + resp_dict = {'Response Status': HTTPCreated().status, + 'Response Body': '', 'Number Files Created': 0} + failed_files = [] + last_yield = time() + if out_content_type and out_content_type.endswith('/xml'): + to_yield = b'\n' + else: + to_yield = b' ' + separator = b'' + containers_accessed = set() + req.environ['eventlet.minimum_write_chunk_size'] = 0 + try: + if not out_content_type: + raise HTTPNotAcceptable(request=req) + + if req.content_length is None and \ + req.headers.get('transfer-encoding', + '').lower() != 'chunked': + raise HTTPLengthRequired(request=req) + try: + vrs, account, extract_base = req.split_path(2, 3, True) + except ValueError: + raise HTTPNotFound(request=req) + extract_base = extract_base or '' + extract_base = extract_base.rstrip('/') + tar = tarfile.open(mode='r|' + compress_type, + fileobj=req.body_file) + failed_response_type = HTTPBadRequest + containers_created = 0 + while True: + if last_yield + self.yield_frequency < time(): + last_yield = time() + yield to_yield + to_yield, separator = b' ', b'\r\n\r\n' + tar_info = tar.next() + if tar_info is None or \ + len(failed_files) >= self.max_failed_extractions: + break + if tar_info.isfile(): + obj_path = tar_info.name.encode('utf-8', 'surrogateescape') + obj_path = bytes_to_wsgi(obj_path) + if obj_path.startswith('./'): + obj_path = obj_path[2:] + obj_path = obj_path.lstrip('/') + if extract_base: + obj_path = extract_base + '/' + obj_path + if '/' not in obj_path: + continue # ignore base level file + + destination = '/'.join( + ['', vrs, account, obj_path]) + container = obj_path.split('/', 1)[0] + if not constraints.check_utf8(wsgi_to_str(destination)): + failed_files.append( + [wsgi_quote(obj_path[:self.max_path_length]), + HTTPPreconditionFailed().status]) + continue + if tar_info.size > constraints.MAX_FILE_SIZE: + failed_files.append([ + wsgi_quote(obj_path[:self.max_path_length]), + HTTPRequestEntityTooLarge().status]) + continue + container_failure = None + if container not in containers_accessed: + cont_path = '/'.join(['', vrs, account, container]) + try: + if self.create_container(req, cont_path): + containers_created += 1 + if containers_created > self.max_containers: + raise HTTPBadRequest( + 'More than %d containers to create ' + 'from tar.' 
% self.max_containers) + except CreateContainerError as err: + # the object PUT to this container still may + # succeed if acls are set + container_failure = [ + wsgi_quote(cont_path[:self.max_path_length]), + err.status] + if err.status_int == HTTP_UNAUTHORIZED: + raise HTTPUnauthorized(request=req) + except ValueError: + failed_files.append([ + wsgi_quote(obj_path[:self.max_path_length]), + HTTPBadRequest().status]) + continue + + tar_file = tar.extractfile(tar_info) + create_headers = { + 'Content-Length': tar_info.size, + 'X-Auth-Token': req.headers.get('X-Auth-Token'), + } + + # Copy some whitelisted headers to the subrequest + for k, v in req.headers.items(): + if ((k.lower() in ('x-delete-at', 'x-delete-after')) + or is_user_meta('object', k)): + create_headers[k] = v + + create_obj_req = make_subrequest( + req.environ, method='PUT', + path=wsgi_quote(destination), + headers=create_headers, + agent='%(orig)s BulkExpand', swift_source='EA') + create_obj_req.environ['wsgi.input'] = tar_file + + for pax_key, pax_value in tar_info.pax_headers.items(): + header_name = pax_key_to_swift_header(pax_key) + if header_name: + # Both pax_key and pax_value are unicode + # strings; the key is already UTF-8 encoded, but + # we still have to encode the value. + create_obj_req.headers[header_name] = \ + pax_value.encode("utf-8") + + resp = create_obj_req.get_response(self.app) + containers_accessed.add(container) + if resp.is_success: + resp_dict['Number Files Created'] += 1 + else: + if container_failure: + failed_files.append(container_failure) + if resp.status_int == HTTP_UNAUTHORIZED: + failed_files.append([ + wsgi_quote(obj_path[:self.max_path_length]), + HTTPUnauthorized().status]) + raise HTTPUnauthorized(request=req) + if resp.status_int // 100 == 5: + failed_response_type = HTTPBadGateway + failed_files.append([ + wsgi_quote(obj_path[:self.max_path_length]), + resp.status]) + + if failed_files: + resp_dict['Response Status'] = failed_response_type().status + elif not resp_dict['Number Files Created']: + resp_dict['Response Status'] = HTTPBadRequest().status + resp_dict['Response Body'] = 'Invalid Tar File: No Valid Files' + + except HTTPException as err: + resp_dict['Response Status'] = err.status + resp_dict['Response Body'] = err.body.decode('utf-8') + except (tarfile.TarError, zlib.error) as tar_error: + resp_dict['Response Status'] = HTTPBadRequest().status + resp_dict['Response Body'] = 'Invalid Tar File: %s' % tar_error + except Exception: + self.logger.exception('Error in extract archive.') + resp_dict['Response Status'] = HTTPServerError().status + + yield separator + get_heartbeat_response_body( + out_content_type, resp_dict, failed_files, 'extract') + + def _process_delete(self, resp, pile, obj_name, resp_dict, + failed_files, failed_file_response, retry=0): + if resp.status_int // 100 == 2: + resp_dict['Number Deleted'] += 1 + elif resp.status_int == HTTP_NOT_FOUND: + resp_dict['Number Not Found'] += 1 + elif resp.status_int == HTTP_UNAUTHORIZED: + failed_files.append([wsgi_quote(str_to_wsgi(obj_name)), + HTTPUnauthorized().status]) + elif resp.status_int == HTTP_CONFLICT and pile and \ + self.retry_count > 0 and self.retry_count > retry: + retry += 1 + sleep(self.retry_interval ** retry) + delete_obj_req = Request.blank(resp.environ['PATH_INFO'], + resp.environ) + + def _retry(req, app, obj_name, retry): + return req.get_response(app), obj_name, retry + pile.spawn(_retry, delete_obj_req, self.app, obj_name, retry) + else: + if resp.status_int // 100 == 5: + 
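+                # a server error on any subrequest downgrades the overall
+                # bulk response status to 502 Bad Gateway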
failed_file_response['type'] = HTTPBadGateway + failed_files.append([wsgi_quote(str_to_wsgi(obj_name)), + resp.status]) + + @wsgify + def __call__(self, req): + extract_type = req.params.get('extract-archive') + resp = None + if extract_type is not None and req.method == 'PUT': + archive_type = { + 'tar': '', 'tar.gz': 'gz', + 'tar.bz2': 'bz2'}.get(extract_type.lower().strip('.')) + if archive_type is not None: + resp = HTTPOk(request=req) + try: + out_content_type = req.accept.best_match( + ACCEPTABLE_FORMATS) + except ValueError: + out_content_type = None # Ignore invalid header + if out_content_type: + resp.content_type = out_content_type + resp.app_iter = self.handle_extract_iter( + req, archive_type, out_content_type=out_content_type) + else: + resp = HTTPBadRequest("Unsupported archive format") + if 'bulk-delete' in req.params and req.method in ['POST', 'DELETE']: + resp = HTTPOk(request=req) + try: + out_content_type = req.accept.best_match(ACCEPTABLE_FORMATS) + except ValueError: + out_content_type = None # Ignore invalid header + if out_content_type: + resp.content_type = out_content_type + resp.app_iter = self.handle_delete_iter( + req, out_content_type=out_content_type) + + return resp or self.app + + +def filter_factory(global_conf, **local_conf): + conf = global_conf.copy() + conf.update(local_conf) + + max_containers_per_extraction = \ + int(conf.get('max_containers_per_extraction', 10000)) + max_failed_extractions = int(conf.get('max_failed_extractions', 1000)) + max_deletes_per_request = int(conf.get('max_deletes_per_request', 10000)) + max_failed_deletes = int(conf.get('max_failed_deletes', 1000)) + yield_frequency = int(conf.get('yield_frequency', 10)) + delete_concurrency = min(1000, max(1, int( + conf.get('delete_concurrency', 2)))) + retry_count = int(conf.get('delete_container_retry_count', 0)) + retry_interval = 1.5 + + register_swift_info( + 'bulk_upload', + max_containers_per_extraction=max_containers_per_extraction, + max_failed_extractions=max_failed_extractions) + register_swift_info( + 'bulk_delete', + max_deletes_per_request=max_deletes_per_request, + max_failed_deletes=max_failed_deletes) + + def bulk_filter(app): + return Bulk( + app, conf, + max_containers_per_extraction=max_containers_per_extraction, + max_failed_extractions=max_failed_extractions, + max_deletes_per_request=max_deletes_per_request, + max_failed_deletes=max_failed_deletes, + yield_frequency=yield_frequency, + delete_concurrency=delete_concurrency, + retry_count=retry_count, + retry_interval=retry_interval) + return bulk_filter diff --git a/swift/common/middleware/catch_errors.py b/swift/common/middleware/catch_errors.py index 4053825376..0b3d37626b 100644 --- a/swift/common/middleware/catch_errors.py +++ b/swift/common/middleware/catch_errors.py @@ -1,4 +1,4 @@ -# Copyright (c) 2010-2012 OpenStack, LLC. +# Copyright (c) 2010-2012 OpenStack Foundation # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. @@ -13,39 +13,124 @@ # See the License for the specific language governing permissions and # limitations under the License. 
-from eventlet import Timeout -import uuid - from swift.common.swob import Request, HTTPServerError -from swift.common.utils import get_logger +from swift.common.utils import get_logger, generate_trans_id, close_if_possible from swift.common.wsgi import WSGIContext +class BadResponseLength(Exception): + pass + + +class ByteEnforcer(object): + """ + Enforces that inner_iter yields exactly bytes before + exhaustion. + + If inner_iter fails to do so, BadResponseLength is raised. + + :param inner_iter: iterable of bytestrings + :param nbytes: number of bytes expected + + N.B. since we require the nbytes param and require the inner_iter to yield + exactly that many bytes we can support the __len__ interface for anyone + happens to expect non chunked resp iterables to support that + (e.g. eventlet's wsgi.server). + """ + + def __init__(self, inner_iter, nbytes): + self.inner_iter = inner_iter + self.nbytes = nbytes + + def __len__(self): + return self.nbytes + + def __iter__(self): + try: + bytes_left = self.nbytes + for chunk in self.inner_iter: + if bytes_left >= len(chunk): + yield chunk + bytes_left -= len(chunk) + else: + yield chunk[:bytes_left] + raise BadResponseLength( + "Too many bytes; truncating after %d bytes " + "with at least %d surplus bytes remaining" % ( + self.nbytes, len(chunk) - bytes_left)) + + if bytes_left: + raise BadResponseLength('Expected another %d bytes' % ( + bytes_left,)) + finally: + close_if_possible(self.inner_iter) + + class CatchErrorsContext(WSGIContext): - def __init__(self, app, logger): + def __init__(self, app, logger, trans_id_suffix=''): super(CatchErrorsContext, self).__init__(app) self.logger = logger + self.trans_id_suffix = trans_id_suffix def handle_request(self, env, start_response): - trans_id = 'tx' + uuid.uuid4().hex + trans_id_suffix = self.trans_id_suffix + trans_id_extra = env.get('HTTP_X_TRANS_ID_EXTRA') + if trans_id_extra: + trans_id_suffix += '-' + trans_id_extra[:32] + + trans_id = generate_trans_id(trans_id_suffix) env['swift.trans_id'] = trans_id self.logger.txn_id = trans_id try: # catch any errors in the pipeline resp = self._app_call(env) - except (Exception, Timeout), err: - self.logger.exception(_('Error: %s'), err) + except: # noqa + self.logger.exception('Error: An error occurred') resp = HTTPServerError(request=Request(env), - body='An error occurred', + body=b'An error occurred', content_type='text/plain') - resp.headers['x-trans-id'] = trans_id + resp.headers['X-Trans-Id'] = trans_id + resp.headers['X-Openstack-Request-Id'] = trans_id return resp(env, start_response) + # If the app specified a Content-Length, enforce that it sends that + # many bytes. + # + # If an app gives too few bytes, then the client will wait for the + # remainder before sending another HTTP request on the same socket; + # since no more bytes are coming, this will result in either an + # infinite wait or a timeout. In this case, we want to raise an + # exception to signal to the WSGI server that it should close the + # TCP connection. + # + # If an app gives too many bytes, then we can deadlock with the + # client; if the client reads its N bytes and then sends a large-ish + # request (enough to fill TCP buffers), it'll block until we read + # some of the request. However, we won't read the request since + # we'll be trying to shove the rest of our oversized response out + # the socket. In that case, we truncate the response body at N bytes + # and raise an exception to stop any more bytes from being + # generated and also to kill the TCP connection. 
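+        # HEAD responses never carry a body, so enforce zero response bytes
+        # regardless of any Content-Length header the app reported.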
+ if env['REQUEST_METHOD'] == 'HEAD': + resp = ByteEnforcer(resp, 0) + + elif self._response_headers: + content_lengths = [val for header, val in self._response_headers + if header.lower() == "content-length"] + if len(content_lengths) == 1: + try: + content_length = int(content_lengths[0]) + except ValueError: + pass + else: + resp = ByteEnforcer(resp, content_length) + # make sure the response has the trans_id if self._response_headers is None: self._response_headers = [] - self._response_headers.append(('x-trans-id', trans_id)) + self._response_headers.append(('X-Trans-Id', trans_id)) + self._response_headers.append(('X-Openstack-Request-Id', trans_id)) start_response(self._response_status, self._response_headers, self._response_exc_info) return resp @@ -60,12 +145,15 @@ class CatchErrorMiddleware(object): def __init__(self, app, conf): self.app = app self.logger = get_logger(conf, log_route='catch-errors') + self.trans_id_suffix = conf.get('trans_id_suffix', '') def __call__(self, env, start_response): """ If used, this should be the first middleware in pipeline. """ - context = CatchErrorsContext(self.app, self.logger) + context = CatchErrorsContext(self.app, + self.logger, + self.trans_id_suffix) return context.handle_request(env, start_response) diff --git a/swift/common/middleware/cname_lookup.py b/swift/common/middleware/cname_lookup.py index 87363b2308..b9ef4f616f 100644 --- a/swift/common/middleware/cname_lookup.py +++ b/swift/common/middleware/cname_lookup.py @@ -1,4 +1,4 @@ -# Copyright (c) 2010-2012 OpenStack, LLC. +# Copyright (c) 2010-2012 OpenStack Foundation # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. @@ -29,35 +29,49 @@ try: import dns.resolver - from dns.exception import DNSException - from dns.resolver import NXDOMAIN, NoAnswer + import dns.exception except ImportError: # catch this to allow docs to be built without the dependency MODULE_DEPENDENCY_MET = False else: # executed if the try block finishes with no errors MODULE_DEPENDENCY_MET = True -from swift.common.swob import Request, HTTPBadRequest -from swift.common.utils import cache_from_env, get_logger +from swift.common.middleware import RewriteContext +from swift.common.swob import Request, HTTPBadRequest, \ + str_to_wsgi, wsgi_to_str +from swift.common.utils import cache_from_env, get_logger, is_valid_ip, \ + list_from_csv, parse_socket_string +from swift.common.registry import register_swift_info -def lookup_cname(domain): # pragma: no cover +def lookup_cname(domain, resolver): # pragma: no cover """ Given a domain, returns its DNS CNAME mapping and DNS ttl. :param domain: domain to query on + :param resolver: dns.resolver.Resolver() instance used for executing DNS + queries :returns: (ttl, result) """ try: - answer = dns.resolver.query(domain, 'CNAME').rrset + answer = resolver.query(domain, 'CNAME').rrset ttl = answer.ttl - result = answer.items[0].to_text() + result = list(answer.items)[0].to_text() result = result.rstrip('.') return ttl, result - except (DNSException, NXDOMAIN, NoAnswer): + except (dns.resolver.NXDOMAIN, dns.resolver.NoAnswer): + # As the memcache lib returns None when nothing is found in cache, + # returning false helps to distinguish between "nothing in cache" + # (None) and "nothing to cache" (False). 
+ return 60, False + except (dns.exception.DNSException): return 0, None +class _CnameLookupContext(RewriteContext): + base_re = r'^(https?://)%s(/.*)?$' + + class CNAMELookupMiddleware(object): """ CNAME Lookup Middleware @@ -74,60 +88,94 @@ def __init__(self, app, conf): # reraise the exception if the dependency wasn't met raise ImportError('dnspython is required for this module') self.app = app - self.storage_domain = conf.get('storage_domain', 'example.com') - if self.storage_domain and self.storage_domain[0] != '.': - self.storage_domain = '.' + self.storage_domain + storage_domain = conf.get('storage_domain', 'example.com') + self.storage_domain = ['.' + s for s in + list_from_csv(storage_domain) + if not s.startswith('.')] + self.storage_domain += [s for s in list_from_csv(storage_domain) + if s.startswith('.')] self.lookup_depth = int(conf.get('lookup_depth', '1')) + nameservers = list_from_csv(conf.get('nameservers')) + try: + for i, server in enumerate(nameservers): + ip_or_host, maybe_port = nameservers[i] = \ + parse_socket_string(server, None) + if not is_valid_ip(ip_or_host): + raise ValueError + if maybe_port is not None: + int(maybe_port) + except ValueError: + raise ValueError('Invalid cname_lookup/nameservers configuration ' + 'found. All nameservers must be valid IPv4 or ' + 'IPv6, followed by an optional : port.') + self.resolver = dns.resolver.Resolver() + if nameservers: + self.resolver.nameservers = [ip for (ip, port) in nameservers] + self.resolver.nameserver_ports = { + ip: int(port) for (ip, port) in nameservers + if port is not None} self.memcache = None self.logger = get_logger(conf, log_route='cname-lookup') + def _domain_endswith_in_storage_domain(self, a_domain): + a_domain = '.' + a_domain + for domain in self.storage_domain: + if a_domain.endswith(domain): + return True + return False + def __call__(self, env, start_response): if not self.storage_domain: return self.app(env, start_response) - given_domain = env['HTTP_HOST'] + if 'HTTP_HOST' in env: + requested_host = env['HTTP_HOST'] + else: + requested_host = env['SERVER_NAME'] + given_domain = wsgi_to_str(requested_host) port = '' if ':' in given_domain: given_domain, port = given_domain.rsplit(':', 1) - if given_domain == self.storage_domain[1:]: # strip initial '.' + if is_valid_ip(given_domain): return self.app(env, start_response) a_domain = given_domain - if not a_domain.endswith(self.storage_domain): + if not self._domain_endswith_in_storage_domain(a_domain): if self.memcache is None: self.memcache = cache_from_env(env) error = True - for tries in xrange(self.lookup_depth): + for tries in range(self.lookup_depth): found_domain = None if self.memcache: memcache_key = ''.join(['cname-', a_domain]) found_domain = self.memcache.get(memcache_key) - if not found_domain: - ttl, found_domain = lookup_cname(a_domain) - if self.memcache: + if found_domain is None: + ttl, found_domain = lookup_cname(a_domain, self.resolver) + if self.memcache and ttl > 0: memcache_key = ''.join(['cname-', given_domain]) self.memcache.set(memcache_key, found_domain, - timeout=ttl) - if found_domain is None or found_domain == a_domain: + time=ttl) + if not found_domain or found_domain == a_domain: # no CNAME records or we're at the last lookup error = True found_domain = None break - elif found_domain.endswith(self.storage_domain): + elif self._domain_endswith_in_storage_domain(found_domain): # Found it! 
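+                    # the CNAME chain resolved into a configured storage
+                    # domain; rewrite the Host header and stop following it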
self.logger.info( - _('Mapped %(given_domain)s to %(found_domain)s') % + 'Mapped %(given_domain)s to %(found_domain)s', {'given_domain': given_domain, 'found_domain': found_domain}) if port: - env['HTTP_HOST'] = ':'.join([found_domain, port]) + env['HTTP_HOST'] = ':'.join([ + str_to_wsgi(found_domain), port]) else: - env['HTTP_HOST'] = found_domain + env['HTTP_HOST'] = str_to_wsgi(found_domain) error = False break else: # try one more deep in the chain self.logger.debug( - _('Following CNAME chain for ' - '%(given_domain)s to %(found_domain)s') % + 'Following CNAME chain for ' + '%(given_domain)s to %(found_domain)s', {'given_domain': given_domain, 'found_domain': found_domain}) a_domain = found_domain @@ -140,6 +188,11 @@ def __call__(self, env, start_response): resp = HTTPBadRequest(request=Request(env), body=msg, content_type='text/plain') return resp(env, start_response) + else: + context = _CnameLookupContext(self.app, requested_host, + env['HTTP_HOST']) + return context.handle_request(env, start_response) + return self.app(env, start_response) @@ -147,6 +200,9 @@ def filter_factory(global_conf, **local_conf): # pragma: no cover conf = global_conf.copy() conf.update(local_conf) + register_swift_info('cname_lookup', + lookup_depth=int(conf.get('lookup_depth', '1'))) + def cname_filter(app): return CNAMELookupMiddleware(app, conf) return cname_filter diff --git a/swift/common/middleware/container_quotas.py b/swift/common/middleware/container_quotas.py new file mode 100644 index 0000000000..2a10c8d2ce --- /dev/null +++ b/swift/common/middleware/container_quotas.py @@ -0,0 +1,122 @@ +# Copyright (c) 2010-2012 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +""" +The ``container_quotas`` middleware implements simple quotas that can be +imposed on swift containers by a user with the ability to set container +metadata, most likely the account administrator. This can be useful for +limiting the scope of containers that are delegated to non-admin users, exposed +to ``formpost`` uploads, or just as a self-imposed sanity check. + +Any object PUT operations that exceed these quotas return a 413 response +(request entity too large) with a descriptive body. + +Quotas are subject to several limitations: eventual consistency, the timeliness +of the cached container_info (60 second ttl by default), and it's unable to +reject chunked transfer uploads that exceed the quota (though once the quota +is exceeded, new chunked transfers will be refused). + +Quotas are set by adding meta values to the container, and are validated when +set: + ++---------------------------------------------+-------------------------------+ +|Metadata | Use | ++=============================================+===============================+ +| X-Container-Meta-Quota-Bytes | Maximum size of the | +| | container, in bytes. | ++---------------------------------------------+-------------------------------+ +| X-Container-Meta-Quota-Count | Maximum object count of the | +| | container. 
| ++---------------------------------------------+-------------------------------+ + +The ``container_quotas`` middleware should be added to the pipeline in your +``/etc/swift/proxy-server.conf`` file just after any auth middleware. +For example:: + + [pipeline:main] + pipeline = catch_errors cache tempauth container_quotas proxy-server + + [filter:container_quotas] + use = egg:swift#container_quotas +""" +from swift.common.http import is_success +from swift.common.swob import HTTPRequestEntityTooLarge, HTTPBadRequest, \ + wsgify +from swift.common.registry import register_swift_info +from swift.proxy.controllers.base import get_container_info + + +class ContainerQuotaMiddleware(object): + def __init__(self, app, *args, **kwargs): + self.app = app + + def bad_response(self, req, container_info): + # 401 if the user couldn't have PUT this object in the first place. + # This prevents leaking the container's existence to unauthed users. + if 'swift.authorize' in req.environ: + req.acl = container_info['write_acl'] + aresp = req.environ['swift.authorize'](req) + if aresp: + return aresp + return HTTPRequestEntityTooLarge(body='Upload exceeds quota.') + + @wsgify + def __call__(self, req): + try: + (version, account, container, obj) = req.split_path(3, 4, True) + except ValueError: + return self.app + + # verify new quota headers are properly formatted + if not obj and req.method in ('PUT', 'POST'): + val = req.headers.get('X-Container-Meta-Quota-Bytes') + if val and not val.isdigit(): + return HTTPBadRequest(body='Invalid bytes quota.') + val = req.headers.get('X-Container-Meta-Quota-Count') + if val and not val.isdigit(): + return HTTPBadRequest(body='Invalid count quota.') + + # check user uploads against quotas + elif obj and req.method in ('PUT'): + container_info = get_container_info( + req.environ, self.app, swift_source='CQ') + if not container_info or not is_success(container_info['status']): + # this will hopefully 404 later + return self.app + + if 'quota-bytes' in container_info.get('meta', {}) and \ + 'bytes' in container_info and \ + container_info['meta']['quota-bytes'].isdigit(): + content_length = (req.content_length or 0) + new_size = int(container_info['bytes']) + content_length + if int(container_info['meta']['quota-bytes']) < new_size: + return self.bad_response(req, container_info) + + if 'quota-count' in container_info.get('meta', {}) and \ + 'object_count' in container_info and \ + container_info['meta']['quota-count'].isdigit(): + new_count = int(container_info['object_count']) + 1 + if int(container_info['meta']['quota-count']) < new_count: + return self.bad_response(req, container_info) + + return self.app + + +def filter_factory(global_conf, **local_conf): + register_swift_info('container_quotas') + + def container_quota_filter(app): + return ContainerQuotaMiddleware(app) + return container_quota_filter diff --git a/swift/common/middleware/container_sync.py b/swift/common/middleware/container_sync.py new file mode 100644 index 0000000000..35b1a7d4b6 --- /dev/null +++ b/swift/common/middleware/container_sync.py @@ -0,0 +1,174 @@ +# Copyright (c) 2013 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. 
+# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +import os + +from swift.common.constraints import valid_api_version +from swift.common.container_sync_realms import ContainerSyncRealms +from swift.common.request_helpers import append_log_info +from swift.common.swob import HTTPBadRequest, HTTPUnauthorized, wsgify +from swift.common.utils import ( + config_true_value, get_logger, streq_const_time) +from swift.proxy.controllers.base import get_container_info +from swift.common.registry import register_swift_info + + +class ContainerSync(object): + """ + WSGI middleware that validates an incoming container sync request + using the container-sync-realms.conf style of container sync. + """ + + def __init__(self, app, conf, logger=None): + self.app = app + self.conf = conf + self.logger = logger or get_logger(conf, log_route='container_sync') + self.realms_conf = ContainerSyncRealms( + os.path.join( + conf.get('swift_dir', '/etc/swift'), + 'container-sync-realms.conf'), + self.logger) + self.allow_full_urls = config_true_value( + conf.get('allow_full_urls', 'true')) + # configure current realm/cluster for /info + self.realm = self.cluster = None + current = conf.get('current', None) + if current: + try: + self.realm, self.cluster = (p.upper() for p in + current.strip('/').split('/')) + except ValueError: + self.logger.error('Invalid current //REALM/CLUSTER (%s)', + current) + self.register_info() + + def register_info(self): + dct = {} + for realm in self.realms_conf.realms(): + clusters = self.realms_conf.clusters(realm) + if clusters: + dct[realm] = {'clusters': dict((c, {}) for c in clusters)} + if self.realm and self.cluster: + try: + dct[self.realm]['clusters'][self.cluster]['current'] = True + except KeyError: + self.logger.error('Unknown current //REALM/CLUSTER (%s)', + '//%s/%s' % (self.realm, self.cluster)) + register_swift_info('container_sync', realms=dct) + + @wsgify + def __call__(self, req): + if req.path == '/info': + # Ensure /info requests get the freshest results + self.register_info() + return self.app + + try: + (version, acc, cont, obj) = req.split_path(3, 4, True) + bad_path = False + except ValueError: + bad_path = True + + # use of bad_path bool is to avoid recursive tracebacks + if bad_path or not valid_api_version(version): + return self.app + + # validate container-sync metdata update + info = get_container_info( + req.environ, self.app, swift_source='CS') + sync_to = req.headers.get('x-container-sync-to') + if req.method in ('PUT', 'POST') and cont and not obj: + versions_cont = info.get( + 'sysmeta', {}).get('versions-container') + if sync_to and versions_cont: + raise HTTPBadRequest( + 'Cannot configure container sync on a container ' + 'with object versioning configured.', + request=req) + + if not self.allow_full_urls: + if sync_to and not sync_to.startswith('//'): + raise HTTPBadRequest( + body='Full URLs are not allowed for X-Container-Sync-To ' + 'values. 
Only realm values of the format ' + '//realm/cluster/account/container are allowed.\n', + request=req) + auth = req.headers.get('x-container-sync-auth') + if auth: + valid = False + auth = auth.split() + if len(auth) != 3: + append_log_info(req.environ, 'cs:not-3-args') + else: + realm, nonce, sig = auth + realm_key = self.realms_conf.key(realm) + realm_key2 = self.realms_conf.key2(realm) + if not realm_key: + append_log_info(req.environ, 'cs:no-local-realm-key') + else: + user_key = info.get('sync_key') + if not user_key: + append_log_info(req.environ, 'cs:no-local-user-key') + else: + # x-timestamp headers get shunted by gatekeeper + if 'x-backend-inbound-x-timestamp' in req.headers: + req.headers['x-timestamp'] = req.headers.pop( + 'x-backend-inbound-x-timestamp') + + expected = self.realms_conf.get_sig( + req.method, req.path, + req.headers.get('x-timestamp', '0'), nonce, + realm_key, user_key) + expected2 = self.realms_conf.get_sig( + req.method, req.path, + req.headers.get('x-timestamp', '0'), nonce, + realm_key2, user_key) if realm_key2 else expected + if not streq_const_time(sig, expected) and \ + not streq_const_time(sig, expected2): + append_log_info(req.environ, 'cs:invalid-sig') + else: + append_log_info(req.environ, 'cs:valid') + valid = True + if not valid: + exc = HTTPUnauthorized( + body='X-Container-Sync-Auth header not valid; ' + 'contact cluster operator for support.', + headers={'content-type': 'text/plain'}, + request=req) + exc.headers['www-authenticate'] = ' '.join([ + 'SwiftContainerSync', + exc.www_authenticate().split(None, 1)[1]]) + raise exc + else: + req.environ['swift.authorize_override'] = True + # An SLO manifest will already be in the internal manifest + # syntax and might be synced before its segments, so stop SLO + # middleware from performing the usual manifest validation. + req.environ['swift.slo_override'] = True + # Similar arguments for static symlinks + req.environ['swift.symlink_override'] = True + + return self.app + + +def filter_factory(global_conf, **local_conf): + conf = global_conf.copy() + conf.update(local_conf) + register_swift_info('container_sync') + + def cache_filter(app): + return ContainerSync(app, conf) + + return cache_filter diff --git a/swift/common/middleware/copy.py b/swift/common/middleware/copy.py new file mode 100644 index 0000000000..fed8f860fe --- /dev/null +++ b/swift/common/middleware/copy.py @@ -0,0 +1,538 @@ +# Copyright (c) 2015 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. +""" +Server side copy is a feature that enables users/clients to COPY objects +between accounts and containers without the need to download and then +re-upload objects, thus eliminating additional bandwidth consumption and +also saving time. This may be used when renaming/moving an object which +in Swift is a (COPY + DELETE) operation. + +The server side copy middleware should be inserted in the pipeline after auth +and before the quotas and large object middlewares. 
If it is not present in the
+pipeline in the proxy-server configuration file, it will be inserted
+automatically. There is no configurable option provided to turn off server
+side copy.
+
+--------
+Metadata
+--------
+* All metadata of the source object is preserved during object copy.
+* One can also provide additional metadata during the PUT/COPY request. This
+  will overwrite any existing conflicting keys.
+* Server side copy can also be used to change the content-type of an existing
+  object.
+
+-----------
+Object Copy
+-----------
+* The destination container must exist before requesting copy of the object.
+* When several replicas exist, the system copies from the most recent replica.
+  That is, the copy operation behaves as though the X-Newest header is in the
+  request.
+* The request to copy an object should have no body (i.e. the content-length
+  of the request must be zero).
+
+There are two ways in which an object can be copied:
+
+1. Send a PUT request to the new object (destination/target) with an
+   additional header named ``X-Copy-From`` specifying the source object
+   (in '/container/object' format). Example::
+
+    curl -i -X PUT http://<storage_url>/container1/destination_obj
+     -H 'X-Auth-Token: <token>'
+     -H 'X-Copy-From: /container2/source_obj'
+     -H 'Content-Length: 0'
+
+2. Send a COPY request with the existing object in the URL and an additional
+   header named ``Destination`` specifying the destination/target object
+   (in '/container/object' format). Example::
+
+    curl -i -X COPY http://<storage_url>/container2/source_obj
+     -H 'X-Auth-Token: <token>'
+     -H 'Destination: /container1/destination_obj'
+     -H 'Content-Length: 0'
+
+Note that if the incoming request has some conditional headers (e.g. ``Range``,
+``If-Match``), the *source* object will be evaluated for these headers (i.e. if
+PUT with both ``X-Copy-From`` and ``Range``, Swift will make a partial copy to
+the destination object).
+
+-------------------------
+Cross Account Object Copy
+-------------------------
+Objects can also be copied from one account to another account if the user
+has the necessary permissions (i.e. permission to read from the container
+in the source account and permission to write to the container in the
+destination account).
+
+Similar to the examples mentioned above, there are two ways to copy objects
+across accounts:
+
+1. Like the example above, send a PUT request to copy the object, but with an
+   additional header named ``X-Copy-From-Account`` specifying the source
+   account. Example::
+
+    curl -i -X PUT http://<host>:<port>/v1/AUTH_test1/container/destination_obj
+     -H 'X-Auth-Token: <token>'
+     -H 'X-Copy-From: /container/source_obj'
+     -H 'X-Copy-From-Account: AUTH_test2'
+     -H 'Content-Length: 0'
+
+2. Like the previous example, send a COPY request, but with an additional
+   header named ``Destination-Account`` specifying the name of the destination
+   account. Example::
+
+    curl -i -X COPY http://<host>:<port>/v1/AUTH_test2/container/source_obj
+     -H 'X-Auth-Token: <token>'
+     -H 'Destination: /container/destination_obj'
+     -H 'Destination-Account: AUTH_test1'
+     -H 'Content-Length: 0'
+
+-------------------
+Large Object Copy
+-------------------
+The best option to copy a large object is to copy its segments individually.
+To copy the manifest object of a large object, add the query parameter to
+the copy request::
+
+    ?multipart-manifest=get
+
+If a request is sent without the query parameter, an attempt will be made to
+copy the whole object, but it will fail if the object size is
+greater than 5GB.
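+
+For illustration only, the PUT-based copy can also be driven from Python. The
+following is a minimal client-side sketch (it is not part of this middleware);
+the storage URL and token values are placeholders that must be replaced::
+
+    import requests
+
+    storage_url = 'http://127.0.0.1:8080/v1/AUTH_test'  # placeholder
+    token = 'AUTH_tk_placeholder'                       # placeholder
+
+    # Server-side copy: a zero-byte PUT to the destination that names the
+    # source object in the X-Copy-From header.
+    resp = requests.put(
+        storage_url + '/container1/destination_obj',
+        headers={'X-Auth-Token': token,
+                 'X-Copy-From': '/container2/source_obj',
+                 'Content-Length': '0'})
+    resp.raise_for_status()  # expect 201 Created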
+ +""" + +from swift.common.utils import get_logger, config_true_value, FileLikeIter, \ + close_if_possible +from swift.common.swob import Request, HTTPPreconditionFailed, \ + HTTPRequestEntityTooLarge, HTTPBadRequest, HTTPException, \ + wsgi_quote, wsgi_unquote +from swift.common.http import HTTP_MULTIPLE_CHOICES, is_success, HTTP_OK +from swift.common.constraints import check_account_format, MAX_FILE_SIZE +from swift.common.request_helpers import copy_header_subset, remove_items, \ + is_sys_meta, is_sys_or_user_meta, is_object_transient_sysmeta, \ + check_path_header, OBJECT_SYSMETA_CONTAINER_UPDATE_OVERRIDE_PREFIX +from swift.common.wsgi import WSGIContext, make_subrequest +import eventlet +from swift.common.request_helpers import get_heartbeat_response_body + + +def _check_copy_from_header(req): + """ + Validate that the value from x-copy-from header is + well formatted. We assume the caller ensures that + x-copy-from header is present in req.headers. + + :param req: HTTP request object + :returns: A tuple with container name and object name + :raise HTTPPreconditionFailed: if x-copy-from value + is not well formatted. + """ + return check_path_header(req, 'X-Copy-From', 2, + 'X-Copy-From header must be of the form ' + '/') + + +def _check_destination_header(req): + """ + Validate that the value from destination header is + well formatted. We assume the caller ensures that + destination header is present in req.headers. + + :param req: HTTP request object + :returns: A tuple with container name and object name + :raise HTTPPreconditionFailed: if destination value + is not well formatted. + """ + return check_path_header(req, 'Destination', 2, + 'Destination header must be of the form ' + '/') + + +def _copy_headers(src, dest): + """ + Will copy desired headers from src to dest. 
+ + :params src: an instance of collections.Mapping + :params dest: an instance of collections.Mapping + """ + for k, v in src.items(): + if (is_sys_or_user_meta('object', k) or + is_object_transient_sysmeta(k) or + k.lower() == 'x-delete-at'): + dest[k] = v + + +class ServerSideCopyWebContext(WSGIContext): + + def __init__(self, app, logger, yield_frequency=10): + super(ServerSideCopyWebContext, self).__init__(app) + self.app = app + self.logger = logger + self.yield_frequency = yield_frequency + + def get_source_resp(self, req): + sub_req = make_subrequest( + req.environ, path=wsgi_quote(req.path_info), headers=req.headers, + swift_source='SSC') + return sub_req.get_response(self.app) + + def send_put_req(self, req, additional_resp_headers, start_response): + heartbeat = config_true_value(req.params.get('heartbeat')) + ACCEPTABLE_FORMATS = ['text/plain', 'application/json'] + + try: + out_content_type = req.accept.best_match(ACCEPTABLE_FORMATS) + except ValueError: + out_content_type = 'text/plain' + if not out_content_type: + out_content_type = 'text/plain' + + if heartbeat: + gt = eventlet.spawn(self._app_call, + req.environ) + start_response('202 Accepted', + [('Content-Type', out_content_type)]) + + def resp_iter(): + # Send an initial heartbeat + yield b' ' + app_iter = [b''] + try: + while not gt.dead: + try: + with eventlet.Timeout(self.yield_frequency): + app_iter = gt.wait() + except eventlet.Timeout: + yield b' ' + except Exception as e: + # Send back the status to the client if error + self._response_status = '500 Internal Error' + app_iter = [str(e).encode('utf8')] + finally: + response_body = b''.join(app_iter).decode('utf8') + resp_dict = {'Response Status': self._response_status, + 'Response Body': response_body} + errors = [] + + if not is_success(self._get_status_int()): + src_path = additional_resp_headers['X-Copied-From'] + errors.append(( + wsgi_quote(src_path), + self._response_status, + )) + + for k, v in additional_resp_headers.items(): + if not k.lower().startswith(('x-object-sysmeta-', + 'x-backend')): + resp_dict[k] = v + + for k, v in self._response_headers: + if not k.lower().startswith(('x-object-sysmeta-', + 'x-backend')): + resp_dict[k] = v + yield get_heartbeat_response_body(out_content_type, + resp_dict, + errors, 'copy') + close_if_possible(gt) + + return resp_iter() + + else: + app_resp = self._app_call(req.environ) + self._adjust_put_response(req, additional_resp_headers) + start_response(self._response_status, + self._response_headers, + self._response_exc_info) + return app_resp + + def _adjust_put_response(self, req, additional_resp_headers): + if is_success(self._get_status_int()): + for header, value in additional_resp_headers.items(): + self._response_headers.append((header, value)) + + def handle_OPTIONS_request(self, req, start_response): + app_resp = self._app_call(req.environ) + if is_success(self._get_status_int()): + for i, (header, value) in enumerate(self._response_headers): + if header.lower() == 'allow' and 'COPY' not in value: + self._response_headers[i] = ('Allow', value + ', COPY') + if header.lower() == 'access-control-allow-methods' and \ + 'COPY' not in value: + self._response_headers[i] = \ + ('Access-Control-Allow-Methods', value + ', COPY') + start_response(self._response_status, + self._response_headers, + self._response_exc_info) + return app_resp + + +class ServerSideCopyMiddleware(object): + + def __init__(self, app, conf): + self.app = app + self.logger = get_logger(conf, log_route="copy") + self.yield_frequency = 
int(conf.get('yield_frequency', 10)) + + def __call__(self, env, start_response): + req = Request(env) + try: + (version, account, container, obj) = req.split_path(4, 4, True) + is_obj_req = True + except ValueError: + is_obj_req = False + if not is_obj_req: + # If obj component is not present in req, do not proceed further. + return self.app(env, start_response) + + try: + # In some cases, save off original request method since it gets + # mutated into PUT during handling. This way logging can display + # the method the client actually sent. + if req.method == 'PUT' and req.headers.get('X-Copy-From'): + return self.handle_PUT(req, start_response) + elif req.method == 'COPY': + req.environ['swift.orig_req_method'] = req.method + return self.handle_COPY(req, start_response, + account, container, obj) + elif req.method == 'OPTIONS': + # Does not interfere with OPTIONS response from + # (account,container) servers and /info response. + return self.handle_OPTIONS(req, start_response) + + except HTTPException as e: + return e(req.environ, start_response) + + return self.app(env, start_response) + + def handle_COPY(self, req, start_response, account, container, obj): + if not req.headers.get('Destination'): + return HTTPPreconditionFailed(request=req, + body='Destination header required' + )(req.environ, start_response) + dest_account = account + if 'Destination-Account' in req.headers: + dest_account = wsgi_unquote(req.headers.get('Destination-Account')) + dest_account = check_account_format(req, dest_account) + req.headers['X-Copy-From-Account'] = wsgi_quote(account) + account = dest_account + del req.headers['Destination-Account'] + dest_container, dest_object = _check_destination_header(req) + source = '/%s/%s' % (container, obj) + container = dest_container + obj = dest_object + # re-write the existing request as a PUT instead of creating a new one + req.method = 'PUT' + # As this the path info is updated with destination container, + # the proxy server app will use the right object controller + # implementation corresponding to the container's policy type. + ver, _junk = req.split_path(1, 2, rest_with_last=True) + req.path_info = '/%s/%s/%s/%s' % ( + ver, dest_account, dest_container, dest_object) + req.headers['Content-Length'] = 0 + req.headers['X-Copy-From'] = wsgi_quote(source) + del req.headers['Destination'] + return self.handle_PUT(req, start_response) + + def _get_source_object(self, ssc_ctx, source_path, req): + source_req = req.copy_get() + + # make sure the source request uses it's container_info + source_req.headers.pop('X-Backend-Storage-Policy-Index', None) + source_req.path_info = source_path + source_req.headers['X-Newest'] = 'true' + + # in case we are copying an SLO manifest, set format=raw parameter + params = source_req.params + if params.get('multipart-manifest') == 'get': + params['format'] = 'raw' + source_req.params = params + + source_resp = ssc_ctx.get_source_resp(source_req) + + if source_resp.content_length is None: + # This indicates a transfer-encoding: chunked source object, + # which currently only happens because there are more than + # CONTAINER_LISTING_LIMIT segments in a segmented object. In + # this case, we're going to refuse to do the server-side copy. 
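+            # (the client will receive 413 Request Entity Too Large)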
+ close_if_possible(source_resp.app_iter) + return HTTPRequestEntityTooLarge(request=req) + + if source_resp.content_length > MAX_FILE_SIZE: + close_if_possible(source_resp.app_iter) + return HTTPRequestEntityTooLarge(request=req) + + return source_resp + + def _create_response_headers(self, source_path, source_resp, sink_req): + resp_headers = dict() + acct, path = source_path.split('/', 3)[2:4] + resp_headers['X-Copied-From-Account'] = wsgi_quote(acct) + resp_headers['X-Copied-From'] = wsgi_quote(path) + if 'last-modified' in source_resp.headers: + resp_headers['X-Copied-From-Last-Modified'] = \ + source_resp.headers['last-modified'] + if 'X-Object-Version-Id' in source_resp.headers: + resp_headers['X-Copied-From-Version-Id'] = \ + source_resp.headers['X-Object-Version-Id'] + # Existing sys and user meta of source object is added to response + # headers in addition to the new ones. + _copy_headers(sink_req.headers, resp_headers) + return resp_headers + + def handle_PUT(self, req, start_response): + if req.content_length: + return HTTPBadRequest(body='Copy requests require a zero byte ' + 'body', request=req, + content_type='text/plain')(req.environ, + start_response) + # If heartbeat is enabled, set minimum_write_chunk_size directly + # in the original client request before making subrequests + if config_true_value(req.params.get('heartbeat')): + wsgi_input = req.environ.get('wsgi.input') + if hasattr(wsgi_input, 'environ'): + wsgi_input.environ['eventlet.minimum_write_chunk_size'] = 0 + # Not sure if we also need to set it in + # the current request's environ + req.environ['eventlet.minimum_write_chunk_size'] = 0 + + # Form the path of source object to be fetched + ver, acct, _rest = req.split_path(2, 3, True) + src_account_name = req.headers.get('X-Copy-From-Account') + if src_account_name: + src_account_name = check_account_format( + req, wsgi_unquote(src_account_name)) + else: + src_account_name = acct + src_container_name, src_obj_name = _check_copy_from_header(req) + source_path = '/%s/%s/%s/%s' % (ver, src_account_name, + src_container_name, src_obj_name) + + # GET the source object, bail out on error + ssc_ctx = ServerSideCopyWebContext(self.app, self.logger, + self.yield_frequency) + source_resp = self._get_source_object(ssc_ctx, source_path, req) + if source_resp.status_int >= HTTP_MULTIPLE_CHOICES: + return source_resp(source_resp.environ, start_response) + + # Create a new Request object based on the original request instance. + # This will preserve original request environ including headers. + sink_req = Request.blank(req.path_info, environ=req.environ) + + def is_object_sysmeta(k): + return is_sys_meta('object', k) + + if config_true_value(req.headers.get('x-fresh-metadata', 'false')): + # x-fresh-metadata only applies to copy, not post-as-copy: ignore + # existing user metadata, update existing sysmeta with new + copy_header_subset(source_resp, sink_req, is_object_sysmeta) + copy_header_subset(req, sink_req, is_object_sysmeta) + else: + # First copy existing sysmeta, user meta and other headers from the + # source to the sink, apart from headers that are conditionally + # copied below and timestamps. 
+ exclude_headers = ('x-static-large-object', 'x-object-manifest', + 'etag', 'content-type', 'x-timestamp', + 'x-backend-timestamp') + copy_header_subset(source_resp, sink_req, + lambda k: k.lower() not in exclude_headers) + # now update with original req headers + sink_req.headers.update(req.headers) + + params = sink_req.params + params_updated = False + + if params.get('multipart-manifest') == 'get': + if 'X-Static-Large-Object' in source_resp.headers: + params['multipart-manifest'] = 'put' + if 'X-Object-Manifest' in source_resp.headers: + del params['multipart-manifest'] + sink_req.headers['X-Object-Manifest'] = \ + source_resp.headers['X-Object-Manifest'] + params_updated = True + + if 'version-id' in params: + del params['version-id'] + params_updated = True + + if params_updated: + sink_req.params = params + + # Set swift.source, data source, content length and etag + # for the PUT request + sink_req.environ['swift.source'] = 'SSC' + sink_req.environ['wsgi.input'] = FileLikeIter(source_resp.app_iter) + sink_req.content_length = source_resp.content_length + if (source_resp.status_int == HTTP_OK and + 'X-Static-Large-Object' not in source_resp.headers and + ('X-Object-Manifest' not in source_resp.headers or + req.params.get('multipart-manifest') == 'get')): + # copy source etag so that copied content is verified, unless: + # - not a 200 OK response: source etag may not match the actual + # content, for example with a 206 Partial Content response to a + # ranged request + # - SLO manifest: etag cannot be specified in manifest PUT; SLO + # generates its own etag value which may differ from source + # - SLO: etag in SLO response is not hash of actual content + # - DLO: etag in DLO response is not hash of actual content + sink_req.headers['Etag'] = source_resp.etag + else: + # since we're not copying the source etag, make sure that any + # container update override values are not copied. + remove_items(sink_req.headers, lambda k: k.startswith( + OBJECT_SYSMETA_CONTAINER_UPDATE_OVERRIDE_PREFIX.title())) + + # We no longer need these headers + sink_req.headers.pop('X-Copy-From', None) + sink_req.headers.pop('X-Copy-From-Account', None) + + # If the copy request does not explicitly override content-type, + # use the one present in the source object. 
+ if not req.headers.get('content-type'): + sink_req.headers['Content-Type'] = \ + source_resp.headers['Content-Type'] + + # Create response headers for PUT response + resp_headers = self._create_response_headers(source_path, + source_resp, sink_req) + + put_resp = ssc_ctx.send_put_req(sink_req, resp_headers, start_response) + + # For heartbeat=on, we need to cleanup the resp iter + if config_true_value(req.params.get('heartbeat')): + def clean_iter(app_iter): + try: + for chunk in app_iter: + yield chunk + finally: + close_if_possible(source_resp.app_iter) + return clean_iter(put_resp) + + close_if_possible(source_resp.app_iter) + return put_resp + + def handle_OPTIONS(self, req, start_response): + return ServerSideCopyWebContext(self.app, self.logger).\ + handle_OPTIONS_request(req, start_response) + + +def filter_factory(global_conf, **local_conf): + conf = global_conf.copy() + conf.update(local_conf) + + def copy_filter(app): + return ServerSideCopyMiddleware(app, conf) + + return copy_filter diff --git a/swift/common/middleware/crossdomain.py b/swift/common/middleware/crossdomain.py new file mode 100644 index 0000000000..c15e524548 --- /dev/null +++ b/swift/common/middleware/crossdomain.py @@ -0,0 +1,105 @@ +# Copyright (c) 2013 OpenStack Foundation. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +from swift.common.swob import Request, Response +from swift.common.registry import register_swift_info + + +class CrossDomainMiddleware(object): + + """ + Cross domain middleware used to respond to requests for cross domain + policy information. + + If the path is ``/crossdomain.xml`` it will respond with an xml cross + domain policy document. This allows web pages hosted elsewhere to use + client side technologies such as Flash, Java and Silverlight to interact + with the Swift API. + + To enable this middleware, add it to the pipeline in your proxy-server.conf + file. It should be added before any authentication (e.g., tempauth or + keystone) middleware. In this example ellipsis (...) indicate other + middleware you may have chosen to use: + + .. code:: cfg + + [pipeline:main] + pipeline = ... crossdomain ... authtoken ... proxy-server + + And add a filter section, such as: + + .. code:: cfg + + [filter:crossdomain] + use = egg:swift#crossdomain + cross_domain_policy = + + + For continuation lines, put some whitespace before the continuation + text. Ensure you put a completely blank line to terminate the + ``cross_domain_policy`` value. + + The ``cross_domain_policy`` name/value is optional. If omitted, the policy + defaults as if you had specified: + + .. code:: cfg + + cross_domain_policy = + + .. note:: + + The default policy is very permissive; this is appropriate + for most public cloud deployments, but may not be appropriate + for all deployments. 
See also: + `CWE-942 `__ + + + """ + + def __init__(self, app, conf, *args, **kwargs): + self.app = app + self.conf = conf + default_domain_policy = '' + self.cross_domain_policy = self.conf.get('cross_domain_policy', + default_domain_policy) + + def GET(self, req): + """Returns a 200 response with cross domain policy information """ + body = '\n' \ + '\n' \ + '\n' \ + '%s\n' \ + '' % self.cross_domain_policy + return Response(request=req, body=body.encode('utf-8'), + content_type="application/xml") + + def __call__(self, env, start_response): + req = Request(env) + if req.path == '/crossdomain.xml' and req.method == 'GET': + return self.GET(req)(env, start_response) + else: + return self.app(env, start_response) + + +def filter_factory(global_conf, **local_conf): + conf = global_conf.copy() + conf.update(local_conf) + register_swift_info('crossdomain') + + def crossdomain_filter(app): + return CrossDomainMiddleware(app, conf) + return crossdomain_filter diff --git a/swift/common/middleware/crypto/__init__.py b/swift/common/middleware/crypto/__init__.py new file mode 100644 index 0000000000..a70e7b8609 --- /dev/null +++ b/swift/common/middleware/crypto/__init__.py @@ -0,0 +1,36 @@ +# Copyright (c) 2016 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. +""" +Implements middleware for object encryption which comprises an instance of a +:class:`~swift.common.middleware.crypto.decrypter.Decrypter` combined with an +instance of an :class:`~swift.common.middleware.crypto.encrypter.Encrypter`. +""" +from swift.common.middleware.crypto.decrypter import Decrypter +from swift.common.middleware.crypto.encrypter import Encrypter + +from swift.common.utils import config_true_value +from swift.common.registry import register_swift_info + + +def filter_factory(global_conf, **local_conf): + """Provides a factory function for loading encryption middleware.""" + conf = global_conf.copy() + conf.update(local_conf) + enabled = not config_true_value(conf.get('disable_encryption', 'false')) + register_swift_info('encryption', admin=True, enabled=enabled) + + def encryption_filter(app): + return Decrypter(Encrypter(app, conf), conf) + return encryption_filter diff --git a/swift/common/middleware/crypto/crypto_utils.py b/swift/common/middleware/crypto/crypto_utils.py new file mode 100644 index 0000000000..980bebb912 --- /dev/null +++ b/swift/common/middleware/crypto/crypto_utils.py @@ -0,0 +1,292 @@ +# Copyright (c) 2015-2016 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
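# Illustrative usage sketch for the ``encryption`` filter factory shown
# above (``proxy_app`` here is assumed to be some pre-existing WSGI
# application, not a name defined by Swift):
#
#     from swift.common.middleware.crypto import filter_factory
#
#     encryption = filter_factory({})
#     wrapped = encryption(proxy_app)
#     # ``wrapped`` is a Decrypter whose ``.app`` is an Encrypter wrapping
#     # ``proxy_app``, so requests pass Decrypter -> Encrypter -> proxy_app
#     # and responses are decrypted on their way back out.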
+import base64 +import binascii +import json +import os + +from cryptography.hazmat.backends import default_backend +from cryptography.hazmat.primitives.ciphers import Cipher, algorithms, modes +import urllib.parse + +from swift.common.exceptions import EncryptionException, UnknownSecretIdError +from swift.common.swob import HTTPInternalServerError +from swift.common.utils import get_logger, parse_header +from swift.common.wsgi import WSGIContext + +CRYPTO_KEY_CALLBACK = 'swift.callback.fetch_crypto_keys' + + +class Crypto(object): + """ + Used by middleware: Calls cryptography library + """ + cipher = 'AES_CTR_256' + # AES will accept several key sizes - we are using 256 bits i.e. 32 bytes + key_length = 32 + iv_length = algorithms.AES.block_size // 8 + + def __init__(self, conf=None): + self.logger = get_logger(conf, log_route="crypto") + # memoize backend to avoid repeated iteration over entry points + self.backend = default_backend() + + def create_encryption_ctxt(self, key, iv): + """ + Creates a crypto context for encrypting + + :param key: 256-bit key + :param iv: 128-bit iv or nonce used for encryption + :raises ValueError: on invalid key or iv + :returns: an instance of an encryptor + """ + self.check_key(key) + engine = Cipher(algorithms.AES(key), modes.CTR(iv), + backend=self.backend) + return engine.encryptor() + + def create_decryption_ctxt(self, key, iv, offset): + """ + Creates a crypto context for decrypting + + :param key: 256-bit key + :param iv: 128-bit iv or nonce used for decryption + :param offset: offset into the message; used for range reads + :returns: an instance of a decryptor + """ + self.check_key(key) + if offset < 0: + raise ValueError('Offset must not be negative') + if offset: + # Adjust IV so that it is correct for decryption at offset. + # The CTR mode offset is incremented for every AES block and taken + # modulo 2^128. + offset_blocks, offset_in_block = divmod(offset, self.iv_length) + ivl = int(binascii.hexlify(iv), 16) + offset_blocks + ivl %= 1 << algorithms.AES.block_size + iv = bytes(bytearray.fromhex(format( + ivl, '0%dx' % (2 * self.iv_length)))) + else: + offset_in_block = 0 + + engine = Cipher(algorithms.AES(key), modes.CTR(iv), + backend=self.backend) + dec = engine.decryptor() + # Adjust decryption boundary within current AES block + dec.update(b'*' * offset_in_block) + return dec + + def create_iv(self): + return os.urandom(self.iv_length) + + def create_crypto_meta(self): + # create a set of parameters + return {'iv': self.create_iv(), 'cipher': self.cipher} + + def check_crypto_meta(self, meta): + """ + Check that crypto meta dict has valid items. 
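        For example, a minimal well-formed crypto meta dict (with an
        illustrative, freshly generated IV) looks like::

            {'cipher': 'AES_CTR_256', 'iv': <16 bytes from create_iv()>}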
+ + :param meta: a dict + :raises EncryptionException: if an error is found in the crypto meta + """ + try: + if meta['cipher'] != self.cipher: + raise EncryptionException('Bad crypto meta: Cipher must be %s' + % self.cipher) + if len(meta['iv']) != self.iv_length: + raise EncryptionException( + 'Bad crypto meta: IV must be length %s bytes' + % self.iv_length) + except KeyError as err: + raise EncryptionException( + 'Bad crypto meta: Missing %s' % err) + + def create_random_key(self): + # helper method to create random key of correct length + return os.urandom(self.key_length) + + def wrap_key(self, wrapping_key, key_to_wrap): + # we don't use an RFC 3394 key wrap algorithm such as cryptography's + # aes_wrap_key because it's slower and we have iv material readily + # available so don't need a deterministic algorithm + iv = self.create_iv() + encryptor = Cipher(algorithms.AES(wrapping_key), modes.CTR(iv), + backend=self.backend).encryptor() + return {'key': encryptor.update(key_to_wrap), 'iv': iv} + + def unwrap_key(self, wrapping_key, context): + # unwrap a key from dict of form returned by wrap_key + # check the key length early - unwrapping won't change the length + self.check_key(context['key']) + decryptor = Cipher(algorithms.AES(wrapping_key), + modes.CTR(context['iv']), + backend=self.backend).decryptor() + return decryptor.update(context['key']) + + def check_key(self, key): + if len(key) != self.key_length: + raise ValueError("Key must be length %s bytes" % self.key_length) + + +class CryptoWSGIContext(WSGIContext): + """ + Base class for contexts used by crypto middlewares. + """ + def __init__(self, crypto_app, server_type, logger): + super(CryptoWSGIContext, self).__init__(crypto_app.app) + self.crypto = crypto_app.crypto + self.logger = logger + self.server_type = server_type + + def get_keys(self, env, required=None, key_id=None): + # Get the key(s) from the keymaster + required = required if required is not None else [self.server_type] + try: + fetch_crypto_keys = env[CRYPTO_KEY_CALLBACK] + except KeyError: + self.logger.exception('ERROR get_keys() missing callback') + raise HTTPInternalServerError( + "Unable to retrieve encryption keys.") + + err = None + try: + keys = fetch_crypto_keys(key_id=key_id) + except UnknownSecretIdError as err: + self.logger.error('get_keys(): unknown key id: %s', err) + raise + except Exception as err: # noqa + self.logger.exception('get_keys(): from callback: %s', err) + raise HTTPInternalServerError( + "Unable to retrieve encryption keys.") + + for name in required: + try: + key = keys[name] + self.crypto.check_key(key) + continue + except KeyError: + self.logger.exception("Missing key for %r", name) + except TypeError: + self.logger.exception("Did not get a keys dict") + except ValueError as e: + # don't include the key in any messages! + self.logger.exception("Bad key for %(name)r: %(err)s", + {'name': name, 'err': e}) + raise HTTPInternalServerError( + "Unable to retrieve encryption keys.") + + return keys + + def get_multiple_keys(self, env): + # get a list of keys from the keymaster containing one dict of keys for + # each of the keymaster root secret ids + keys = [self.get_keys(env)] + active_key_id = keys[0]['id'] + for other_key_id in keys[0].get('all_ids', []): + if other_key_id == active_key_id: + continue + keys.append(self.get_keys(env, key_id=other_key_id)) + return keys + + +def dump_crypto_meta(crypto_meta): + """ + Serialize crypto meta to a form suitable for including in a header value. 
+ + The crypto-meta is serialized as a json object. The iv and key values are + random bytes and as a result need to be base64 encoded before sending over + the wire. Base64 encoding returns a bytes object in py3, to future proof + the code, decode this data to produce a string, which is what the + json.dumps function expects. + + :param crypto_meta: a dict containing crypto meta items + :returns: a string serialization of a crypto meta dict + """ + def b64_encode_meta(crypto_meta): + return { + name: (base64.b64encode(value).decode() if name in ('iv', 'key') + else b64_encode_meta(value) if isinstance(value, dict) + else value) + for name, value in crypto_meta.items()} + + # use sort_keys=True to make serialized form predictable for testing + return urllib.parse.quote_plus( + json.dumps(b64_encode_meta(crypto_meta), sort_keys=True)) + + +def load_crypto_meta(value, b64decode=True): + """ + Build the crypto_meta from the json object. + + Note that json.loads always produces unicode strings; to ensure the + resultant crypto_meta matches the original object: + * cast all keys to str (effectively a no-op on py3), + * base64 decode 'key' and 'iv' values to bytes, and + * encode remaining string values as UTF-8 on py2 (while leaving them + as native unicode strings on py3). + + :param value: a string serialization of a crypto meta dict + :param b64decode: decode the 'key' and 'iv' values to bytes, default True + :returns: a dict containing crypto meta items + :raises EncryptionException: if an error occurs while parsing the + crypto meta + """ + def b64_decode_meta(crypto_meta): + return { + str(name): ( + base64.b64decode(val) if name in ('iv', 'key') and b64decode + else b64_decode_meta(val) if isinstance(val, dict) + else val) + for name, val in crypto_meta.items()} + + try: + if not isinstance(value, str): + raise ValueError('crypto meta not a string') + val = json.loads(urllib.parse.unquote_plus(value)) + if not isinstance(val, dict): + raise ValueError('crypto meta not a Mapping') + return b64_decode_meta(val) + except (KeyError, ValueError, TypeError) as err: + msg = 'Bad crypto meta %r: %s' % (value, err) + raise EncryptionException(msg) + + +def append_crypto_meta(value, crypto_meta): + """ + Serialize and append crypto metadata to an encrypted value. + + :param value: value to which serialized crypto meta will be appended. + :param crypto_meta: a dict of crypto meta + :return: a string of the form ; swift_meta= + """ + if not isinstance(value, str): + raise ValueError + return '%s; swift_meta=%s' % (value, dump_crypto_meta(crypto_meta)) + + +def extract_crypto_meta(value): + """ + Extract and deserialize any crypto meta from the end of a value. + + :param value: string that may have crypto meta at end + :return: a tuple of the form: + (, or None) + """ + swift_meta = None + value, meta = parse_header(value) + if 'swift_meta' in meta: + swift_meta = load_crypto_meta(meta['swift_meta']) + return value, swift_meta diff --git a/swift/common/middleware/crypto/decrypter.py b/swift/common/middleware/crypto/decrypter.py new file mode 100644 index 0000000000..7caa34aee6 --- /dev/null +++ b/swift/common/middleware/crypto/decrypter.py @@ -0,0 +1,481 @@ +# Copyright (c) 2015-2016 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. 
+# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +import base64 +import json + +from swift.common.constraints import valid_api_version, check_utf8 +from swift.common.header_key_dict import HeaderKeyDict +from swift.common.http import is_success +from swift.common.middleware.crypto.crypto_utils import CryptoWSGIContext, \ + load_crypto_meta, extract_crypto_meta, Crypto +from swift.common.exceptions import EncryptionException, UnknownSecretIdError +from swift.common.request_helpers import get_object_transient_sysmeta, \ + get_sys_meta_prefix, get_user_meta_prefix, \ + get_container_update_override_key +from swift.common.swob import Request, HTTPException, \ + HTTPInternalServerError, wsgi_to_bytes, bytes_to_wsgi, wsgi_to_str +from swift.common.utils import get_logger, config_true_value, \ + parse_content_range, closing_if_possible, parse_content_type, \ + FileLikeIter, multipart_byteranges_to_document_iters + +DECRYPT_CHUNK_SIZE = 65536 + + +def purge_crypto_sysmeta_headers(headers): + return [h for h in headers if not + h[0].lower().startswith( + (get_object_transient_sysmeta('crypto-'), + get_sys_meta_prefix('object') + 'crypto-'))] + + +class BaseDecrypterContext(CryptoWSGIContext): + def get_crypto_meta(self, header_name, check=True): + """ + Extract a crypto_meta dict from a header. + + :param header_name: name of header that may have crypto_meta + :param check: if True validate the crypto meta + :return: A dict containing crypto_meta items + :raises EncryptionException: if an error occurs while parsing the + crypto meta + """ + crypto_meta_json = self._response_header_value(header_name) + + if crypto_meta_json is None: + return None + crypto_meta = load_crypto_meta(crypto_meta_json) + if check: + self.crypto.check_crypto_meta(crypto_meta) + return crypto_meta + + def get_unwrapped_key(self, crypto_meta, wrapping_key): + """ + Get a wrapped key from crypto-meta and unwrap it using the provided + wrapping key. + + :param crypto_meta: a dict of crypto-meta + :param wrapping_key: key to be used to decrypt the wrapped key + :return: an unwrapped key + :raises HTTPInternalServerError: if the crypto-meta has no wrapped key + or the unwrapped key is invalid + """ + try: + return self.crypto.unwrap_key(wrapping_key, + crypto_meta['body_key']) + except KeyError as err: + self.logger.error( + 'Error decrypting %(resp_type)s: Missing %(key)s', + {'resp_type': self.server_type, 'key': err}) + except ValueError as err: + self.logger.error('Error decrypting %(resp_type)s: %(reason)s', + {'resp_type': self.server_type, 'reason': err}) + raise HTTPInternalServerError( + body='Error decrypting %s' % self.server_type, + content_type='text/plain') + + def decrypt_value_with_meta(self, value, key, required, decoder): + """ + Base64-decode and decrypt a value if crypto meta can be extracted from + the value itself, otherwise return the value unmodified. 
+ + A value should either be a string that does not contain the ';' + character or should be of the form:: + + ;swift_meta= + + :param value: value to decrypt + :param key: crypto key to use + :param required: if True then the value is required to be decrypted + and an EncryptionException will be raised if the + header cannot be decrypted due to missing crypto meta. + :param decoder: function to turn the decrypted bytes into useful data + :returns: decrypted value if crypto meta is found, otherwise the + unmodified value + :raises EncryptionException: if an error occurs while parsing crypto + meta or if the header value was required + to be decrypted but crypto meta was not + found. + """ + extracted_value, crypto_meta = extract_crypto_meta(value) + if crypto_meta: + self.crypto.check_crypto_meta(crypto_meta) + value = self.decrypt_value( + extracted_value, key, crypto_meta, decoder) + elif required: + raise EncryptionException( + "Missing crypto meta in value %s" % value) + + return value + + def decrypt_value(self, value, key, crypto_meta, decoder): + """ + Base64-decode and decrypt a value using the crypto_meta provided. + + :param value: a base64-encoded value to decrypt + :param key: crypto key to use + :param crypto_meta: a crypto-meta dict of form returned by + :py:func:`~swift.common.middleware.crypto.Crypto.get_crypto_meta` + :param decoder: function to turn the decrypted bytes into useful data + :returns: decrypted value + """ + if not value: + return decoder(b'') + crypto_ctxt = self.crypto.create_decryption_ctxt( + key, crypto_meta['iv'], 0) + return decoder(crypto_ctxt.update(base64.b64decode(value))) + + def get_decryption_keys(self, req, crypto_meta=None): + """ + Determine if a response should be decrypted, and if so then fetch keys. + + :param req: a Request object + :param crypto_meta: a dict of crypto metadata + :returns: a dict of decryption keys + """ + if config_true_value(req.environ.get('swift.crypto.override')): + self.logger.debug('No decryption is necessary because of override') + return None + + key_id = crypto_meta.get('key_id') if crypto_meta else None + return self.get_keys(req.environ, key_id=key_id) + + +class DecrypterObjContext(BaseDecrypterContext): + def __init__(self, decrypter, logger): + super(DecrypterObjContext, self).__init__(decrypter, 'object', logger) + + def _decrypt_header(self, header, value, key, required=False): + """ + Attempt to decrypt a header value that may be encrypted. + + :param header: the header name + :param value: the header value + :param key: decryption key + :param required: if True then the header is required to be decrypted + and an HTTPInternalServerError will be raised if the + header cannot be decrypted due to missing crypto meta. + :return: decrypted value or the original value if it was not encrypted. + :raises HTTPInternalServerError: if an error occurred during decryption + or if the header value was required to + be decrypted but crypto meta was not + found. 
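        For example (illustrative), an encrypted header value has the form
        ``<base64 ciphertext>; swift_meta=<serialized crypto meta>``, as
        produced by ``append_crypto_meta``; a value with no appended crypto
        meta is returned unmodified, or rejected if ``required`` is True.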
+ """ + try: + return self.decrypt_value_with_meta( + value, key, required, bytes_to_wsgi) + except EncryptionException as err: + self.logger.error( + "Error decrypting header %(header)s: %(error)s", + {'header': header, 'error': err}) + raise HTTPInternalServerError( + body='Error decrypting header', + content_type='text/plain') + + def decrypt_user_metadata(self, keys): + prefix = get_object_transient_sysmeta('crypto-meta-') + prefix_len = len(prefix) + new_prefix = get_user_meta_prefix(self.server_type).title() + result = [] + for name, val in self._response_headers: + if name.lower().startswith(prefix) and val: + short_name = name[prefix_len:] + decrypted_value = self._decrypt_header( + name, val, keys[self.server_type], required=True) + result.append((new_prefix + short_name, decrypted_value)) + return result + + def decrypt_resp_headers(self, put_keys, post_keys, update_cors_exposed): + """ + Find encrypted headers and replace with the decrypted versions. + + :param put_keys: a dict of decryption keys used for object PUT. + :param post_keys: a dict of decryption keys used for object POST. + :return: A list of headers with any encrypted headers replaced by their + decrypted values. + :raises HTTPInternalServerError: if any error occurs while decrypting + headers + """ + mod_hdr_pairs = [] + + if put_keys: + # Decrypt plaintext etag and place in Etag header for client + # response + etag_header = 'X-Object-Sysmeta-Crypto-Etag' + encrypted_etag = self._response_header_value(etag_header) + if encrypted_etag: + decrypted_etag = self._decrypt_header( + etag_header, encrypted_etag, put_keys['object'], + required=True) + mod_hdr_pairs.append(('Etag', decrypted_etag)) + + etag_header = get_container_update_override_key('etag') + encrypted_etag = self._response_header_value(etag_header) + if encrypted_etag: + decrypted_etag = self._decrypt_header( + etag_header, encrypted_etag, put_keys['container']) + mod_hdr_pairs.append((etag_header, decrypted_etag)) + + # Decrypt all user metadata. Encrypted user metadata values are stored + # in the x-object-transient-sysmeta-crypto-meta- namespace. Those are + # decrypted and moved back to the x-object-meta- namespace. Prior to + # decryption, the response should have no x-object-meta- headers, but + # if it does then they will be overwritten by any decrypted headers + # that map to the same x-object-meta- header names i.e. decrypted + # headers win over unexpected, unencrypted headers. + if post_keys: + decrypted_meta = self.decrypt_user_metadata(post_keys) + mod_hdr_pairs.extend(decrypted_meta) + else: + decrypted_meta = [] + + mod_hdr_names = {h.lower() for h, v in mod_hdr_pairs} + + found_aceh = False + for header, value in self._response_headers: + lheader = header.lower() + if lheader in mod_hdr_names: + continue + if lheader == 'access-control-expose-headers': + found_aceh = True + mod_hdr_pairs.append((header, value + ', ' + ', '.join( + meta.lower() for meta, _data in decrypted_meta))) + else: + mod_hdr_pairs.append((header, value)) + if update_cors_exposed and not found_aceh: + mod_hdr_pairs.append(('Access-Control-Expose-Headers', ', '.join( + meta.lower() for meta, _data in decrypted_meta))) + return mod_hdr_pairs + + def multipart_response_iter(self, resp, boundary, body_key, crypto_meta): + """ + Decrypts a multipart mime doc response body. 
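        Each part of the source document is re-emitted with its original part
        headers and a body decrypted from the appropriate offset, roughly
        (illustrative sketch)::

            --<boundary>
            Content-Type: application/octet-stream
            Content-Range: bytes 10-19/100

            <decrypted bytes for that range>
            --<boundary>--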
+ + :param resp: application response + :param boundary: multipart boundary string + :param body_key: decryption key for the response body + :param crypto_meta: crypto_meta for the response body + :return: generator for decrypted response body + """ + with closing_if_possible(resp): + parts_iter = multipart_byteranges_to_document_iters( + FileLikeIter(resp), boundary) + for first_byte, last_byte, length, headers, body in parts_iter: + yield b"--" + boundary + b"\r\n" + + for header, value in headers: + yield b"%s: %s\r\n" % (wsgi_to_bytes(header), + wsgi_to_bytes(value)) + + yield b"\r\n" + + decrypt_ctxt = self.crypto.create_decryption_ctxt( + body_key, crypto_meta['iv'], first_byte) + for chunk in iter(lambda: body.read(DECRYPT_CHUNK_SIZE), b''): + yield decrypt_ctxt.update(chunk) + + yield b"\r\n" + + yield b"--" + boundary + b"--" + + def response_iter(self, resp, body_key, crypto_meta, offset): + """ + Decrypts a response body. + + :param resp: application response + :param body_key: decryption key for the response body + :param crypto_meta: crypto_meta for the response body + :param offset: offset into object content at which response body starts + :return: generator for decrypted response body + """ + decrypt_ctxt = self.crypto.create_decryption_ctxt( + body_key, crypto_meta['iv'], offset) + with closing_if_possible(resp): + for chunk in resp: + yield decrypt_ctxt.update(chunk) + + def _read_crypto_meta(self, header, check): + crypto_meta = None + if (is_success(self._get_status_int()) or + self._get_status_int() in (304, 412)): + try: + crypto_meta = self.get_crypto_meta(header, check) + except EncryptionException as err: + self.logger.error('Error decrypting object: %s', err) + raise HTTPInternalServerError( + body='Error decrypting object', content_type='text/plain') + return crypto_meta + + def handle(self, req, start_response): + app_resp = self._app_call(req.environ) + + try: + put_crypto_meta = self._read_crypto_meta( + 'X-Object-Sysmeta-Crypto-Body-Meta', True) + put_keys = self.get_decryption_keys(req, put_crypto_meta) + post_crypto_meta = self._read_crypto_meta( + 'X-Object-Transient-Sysmeta-Crypto-Meta', False) + post_keys = self.get_decryption_keys(req, post_crypto_meta) + except EncryptionException as err: + self.logger.error( + "Error decrypting object: %s", + err) + raise HTTPInternalServerError( + body='Error decrypting object', + content_type='text/plain') + + if put_keys is None and post_keys is None: + # skip decryption + start_response(self._response_status, self._response_headers, + self._response_exc_info) + return app_resp + + mod_resp_headers = self.decrypt_resp_headers( + put_keys, post_keys, + update_cors_exposed=bool(req.headers.get('origin'))) + + if put_crypto_meta and req.method == 'GET' and \ + is_success(self._get_status_int()): + # 2xx response and encrypted body + body_key = self.get_unwrapped_key( + put_crypto_meta, put_keys['object']) + content_type, content_type_attrs = parse_content_type( + self._response_header_value('Content-Type')) + + if (self._get_status_int() == 206 and + content_type == 'multipart/byteranges'): + boundary = wsgi_to_bytes(dict(content_type_attrs)["boundary"]) + resp_iter = self.multipart_response_iter( + app_resp, boundary, body_key, put_crypto_meta) + else: + offset = 0 + content_range = self._response_header_value('Content-Range') + if content_range: + # Determine offset within the whole object if ranged GET + offset, end, total = parse_content_range(content_range) + resp_iter = self.response_iter( + app_resp, body_key, 
put_crypto_meta, offset) + else: + # don't decrypt body of unencrypted or non-2xx responses + resp_iter = app_resp + + mod_resp_headers = purge_crypto_sysmeta_headers(mod_resp_headers) + start_response(self._response_status, mod_resp_headers, + self._response_exc_info) + + return resp_iter + + +class DecrypterContContext(BaseDecrypterContext): + def __init__(self, decrypter, logger): + super(DecrypterContContext, self).__init__( + decrypter, 'container', logger) + + def handle(self, req, start_response): + app_resp = self._app_call(req.environ) + + if is_success(self._get_status_int()): + # only decrypt body of 2xx responses + headers = HeaderKeyDict(self._response_headers) + content_type = headers.get('content-type', '').split(';', 1)[0] + if content_type == 'application/json': + app_resp = self.process_json_resp(req, app_resp) + + start_response(self._response_status, + self._response_headers, + self._response_exc_info) + + return app_resp + + def process_json_resp(self, req, resp_iter): + """ + Parses json body listing and decrypt encrypted entries. Updates + Content-Length header with new body length and return a body iter. + """ + with closing_if_possible(resp_iter): + resp_body = b''.join(resp_iter) + body_json = json.loads(resp_body) + new_body = json.dumps([self.decrypt_obj_dict(req, obj_dict) + for obj_dict in body_json]).encode('ascii') + self.update_content_length(len(new_body)) + return [new_body] + + def decrypt_obj_dict(self, req, obj_dict): + if 'hash' in obj_dict: + # each object's etag may have been encrypted with a different key + # so fetch keys based on its crypto meta + ciphertext, crypto_meta = extract_crypto_meta(obj_dict['hash']) + bad_keys = set() + if crypto_meta: + try: + self.crypto.check_crypto_meta(crypto_meta) + keys = self.get_decryption_keys(req, crypto_meta) + # Note that symlinks (for example) may put swift paths in + # the listing ETag, so we can't just use ASCII. + obj_dict['hash'] = self.decrypt_value( + ciphertext, keys['container'], crypto_meta, + decoder=lambda x: x.decode('utf-8')) + except EncryptionException as err: + if not isinstance(err, UnknownSecretIdError) or \ + err.args[0] not in bad_keys: + # Only warn about an unknown key once per listing + self.logger.error( + "Error decrypting container listing: %s", + err) + if isinstance(err, UnknownSecretIdError): + bad_keys.add(err.args[0]) + obj_dict['hash'] = '' + return obj_dict + + +class Decrypter(object): + """Middleware for decrypting data and user metadata.""" + + def __init__(self, app, conf): + self.app = app + self.logger = get_logger(conf, log_route="decrypter") + self.crypto = Crypto(conf) + + def __call__(self, env, start_response): + req = Request(env) + try: + parts = req.split_path(3, 4, True) + is_cont_or_obj_req = True + except ValueError: + is_cont_or_obj_req = False + + if not is_cont_or_obj_req: + return self.app(env, start_response) + if not valid_api_version(parts[0]): + # Not a swift request + return self.app(env, start_response) + if not check_utf8(wsgi_to_str(req.path_info), + internal=req.allow_reserved_names): + # Not a valid swift request + return self.app(env, start_response) + # TODO any other invalid paths we want to ignore?? 
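        # Illustrative note: parts is (version, account, container, obj), with
        # any missing trailing segments set to None. For a hypothetical object
        # GET /v1/AUTH_test/cont/obj, parts == ('v1', 'AUTH_test', 'cont',
        # 'obj'); for a container GET /v1/AUTH_test/cont it is
        # ('v1', 'AUTH_test', 'cont', None).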
+ + if parts[3] and req.method in ('GET', 'HEAD'): + handler = DecrypterObjContext(self, self.logger).handle + elif parts[2] and req.method == 'GET': + handler = DecrypterContContext(self, self.logger).handle + else: + # url and/or request verb is not handled by decrypter + return self.app(env, start_response) + + try: + return handler(req, start_response) + except HTTPException as err_resp: + return err_resp(env, start_response) diff --git a/swift/common/middleware/crypto/encrypter.py b/swift/common/middleware/crypto/encrypter.py new file mode 100644 index 0000000000..b33aaeaf7a --- /dev/null +++ b/swift/common/middleware/crypto/encrypter.py @@ -0,0 +1,383 @@ +# Copyright (c) 2015-2016 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. +import base64 +import hashlib +import hmac +from contextlib import contextmanager + +from swift.common.constraints import check_metadata +from swift.common.http import is_success +from swift.common.middleware.crypto.crypto_utils import CryptoWSGIContext, \ + dump_crypto_meta, append_crypto_meta, Crypto +from swift.common.request_helpers import get_object_transient_sysmeta, \ + strip_user_meta_prefix, is_user_meta, update_etag_is_at_header, \ + get_container_update_override_key +from swift.common.swob import Request, Match, HTTPException, \ + HTTPUnprocessableEntity, wsgi_to_bytes, bytes_to_wsgi, normalize_etag +from swift.common.utils import get_logger, config_true_value, \ + MD5_OF_EMPTY_STRING, md5, InputProxy + + +def encrypt_header_val(crypto, value, key): + """ + Encrypt a header value using the supplied key. + + :param crypto: a Crypto instance + :param value: value to encrypt + :param key: crypto key to use + :returns: a tuple of (encrypted value, crypto_meta) where crypto_meta is a + dict of form returned by + :py:func:`~swift.common.middleware.crypto.Crypto.get_crypto_meta` + :raises ValueError: if value is empty + """ + if not value: + raise ValueError('empty value is not acceptable') + + crypto_meta = crypto.create_crypto_meta() + crypto_ctxt = crypto.create_encryption_ctxt(key, crypto_meta['iv']) + enc_val = bytes_to_wsgi(base64.b64encode( + crypto_ctxt.update(wsgi_to_bytes(value)))) + return enc_val, crypto_meta + + +def _hmac_etag(key, etag): + """ + Compute an HMAC-SHA256 using given key and etag. + + :param key: The starting key for the hash. + :param etag: The etag to hash. 
+ :returns: a Base64-encoded representation of the HMAC + """ + if not isinstance(etag, bytes): + etag = wsgi_to_bytes(etag) + result = hmac.new(key, etag, digestmod=hashlib.sha256).digest() + return base64.b64encode(result).decode() + + +class EncInputWrapper(InputProxy): + """File-like object to be swapped in for wsgi.input.""" + def __init__(self, crypto, keys, req, logger): + super().__init__(req.environ['wsgi.input']) + self.env = req.environ + self.path = req.path + self.crypto = crypto + self.body_crypto_ctxt = None + self.keys = keys + self.plaintext_md5 = None + self.ciphertext_md5 = None + self.logger = logger + self.install_footers_callback(req) + + def _init_encryption_context(self): + # do this once when body is first read + if self.body_crypto_ctxt is None: + self.body_crypto_meta = self.crypto.create_crypto_meta() + body_key = self.crypto.create_random_key() + # wrap the body key with object key + self.body_crypto_meta['body_key'] = self.crypto.wrap_key( + self.keys['object'], body_key) + self.body_crypto_meta['key_id'] = self.keys['id'] + self.body_crypto_ctxt = self.crypto.create_encryption_ctxt( + body_key, self.body_crypto_meta.get('iv')) + self.plaintext_md5 = md5(usedforsecurity=False) + self.ciphertext_md5 = md5(usedforsecurity=False) + + def install_footers_callback(self, req): + # the proxy controller will call back for footer metadata after + # body has been sent + inner_callback = req.environ.get('swift.callback.update_footers') + # remove any Etag from headers, it won't be valid for ciphertext and + # we'll send the ciphertext Etag later in footer metadata + client_etag = req.headers.pop('etag', None) + override_header = get_container_update_override_key('etag') + container_listing_etag_header = req.headers.get(override_header) + + def footers_callback(footers): + if inner_callback: + # pass on footers dict to any other callback that was + # registered before this one. It may override any footers that + # were set. + inner_callback(footers) + + plaintext_etag = None + if self.body_crypto_ctxt: + plaintext_etag = self.plaintext_md5.hexdigest() + # If client (or other middleware) supplied etag, then validate + # against plaintext etag + etag_to_check = footers.get('Etag') or client_etag + if (etag_to_check is not None and + plaintext_etag != etag_to_check): + raise HTTPUnprocessableEntity(request=Request(self.env)) + + # override any previous notion of etag with the ciphertext etag + footers['Etag'] = self.ciphertext_md5.hexdigest() + + # Encrypt the plaintext etag using the object key and persist + # as sysmeta along with the crypto parameters that were used. + encrypted_etag, etag_crypto_meta = encrypt_header_val( + self.crypto, plaintext_etag, self.keys['object']) + footers['X-Object-Sysmeta-Crypto-Etag'] = \ + append_crypto_meta(encrypted_etag, etag_crypto_meta) + footers['X-Object-Sysmeta-Crypto-Body-Meta'] = \ + dump_crypto_meta(self.body_crypto_meta) + + # Also add an HMAC of the etag for use when evaluating + # conditional requests + footers['X-Object-Sysmeta-Crypto-Etag-Mac'] = _hmac_etag( + self.keys['object'], plaintext_etag) + else: + # No data was read from body, nothing was encrypted, so don't + # set any crypto sysmeta for the body, but do re-instate any + # etag provided in inbound request if other middleware has not + # already set a value. 
+ if client_etag is not None: + footers.setdefault('Etag', client_etag) + + # When deciding on the etag that should appear in container + # listings, look for: + # * override in the footer, otherwise + # * override in the header, and finally + # * MD5 of the plaintext received + # This may be None if no override was set and no data was read. An + # override value of '' will be passed on. + container_listing_etag = footers.get( + override_header, container_listing_etag_header) + + if container_listing_etag is None: + container_listing_etag = plaintext_etag + + if (container_listing_etag and + (container_listing_etag != MD5_OF_EMPTY_STRING or + plaintext_etag)): + # Encrypt the container-listing etag using the container key + # and a random IV, and use it to override the container update + # value, with the crypto parameters appended. We use the + # container key here so that only that key is required to + # decrypt all etag values in a container listing when handling + # a container GET request. Don't encrypt an MD5_OF_EMPTY_STRING + # unless there actually was some body content, in which case + # the container-listing etag is possibly conveying some + # non-obvious information. + val, crypto_meta = encrypt_header_val( + self.crypto, container_listing_etag, + self.keys['container']) + crypto_meta['key_id'] = self.keys['id'] + footers[override_header] = \ + append_crypto_meta(val, crypto_meta) + # else: no override was set and no data was read + + req.environ['swift.callback.update_footers'] = footers_callback + + def chunk_update(self, chunk, eof, *args, **kwargs): + if chunk: + self._init_encryption_context() + self.plaintext_md5.update(chunk) + # Encrypt one chunk at a time + ciphertext = self.body_crypto_ctxt.update(chunk) + self.ciphertext_md5.update(ciphertext) + return ciphertext + + return chunk + + +class EncrypterObjContext(CryptoWSGIContext): + def __init__(self, encrypter, logger): + super(EncrypterObjContext, self).__init__( + encrypter, 'object', logger) + + def _check_headers(self, req): + # Check the user-metadata length before encrypting and encoding + error_response = check_metadata(req, self.server_type) + if error_response: + raise error_response + + def encrypt_user_metadata(self, req, keys): + """ + Encrypt user-metadata header values. Replace each x-object-meta- + user metadata header with a corresponding + x-object-transient-sysmeta-crypto-meta- header which has the + crypto metadata required to decrypt appended to the encrypted value. + + :param req: a swob Request + :param keys: a dict of encryption keys + """ + prefix = get_object_transient_sysmeta('crypto-meta-') + user_meta_headers = [h for h in req.headers.items() if + is_user_meta(self.server_type, h[0]) and h[1]] + crypto_meta = None + for name, val in user_meta_headers: + short_name = strip_user_meta_prefix(self.server_type, name) + new_name = prefix + short_name + enc_val, crypto_meta = encrypt_header_val( + self.crypto, val, keys[self.server_type]) + req.headers[new_name] = append_crypto_meta(enc_val, crypto_meta) + req.headers.pop(name) + # store a single copy of the crypto meta items that are common to all + # encrypted user metadata independently of any such meta that is stored + # with the object body because it might change on a POST. This is done + # for future-proofing - the meta stored here is not currently used + # during decryption. 
+ if crypto_meta: + meta = dump_crypto_meta({'cipher': crypto_meta['cipher'], + 'key_id': keys['id']}) + req.headers[get_object_transient_sysmeta('crypto-meta')] = meta + + def handle_put(self, req, start_response): + self._check_headers(req) + keys = self.get_keys(req.environ, required=['object', 'container']) + self.encrypt_user_metadata(req, keys) + + enc_input_proxy = EncInputWrapper(self.crypto, keys, req, self.logger) + req.environ['wsgi.input'] = enc_input_proxy + + resp = self._app_call(req.environ) + + # If an etag is in the response headers and a plaintext etag was + # calculated, then overwrite the response value with the plaintext etag + # provided it matches the ciphertext etag. If it does not match then do + # not overwrite and allow the response value to return to client. + mod_resp_headers = self._response_headers + if (is_success(self._get_status_int()) and + enc_input_proxy.plaintext_md5): + plaintext_etag = enc_input_proxy.plaintext_md5.hexdigest() + ciphertext_etag = enc_input_proxy.ciphertext_md5.hexdigest() + mod_resp_headers = [ + (h, v if (h.lower() != 'etag' or + normalize_etag(v) != ciphertext_etag) + else plaintext_etag) + for h, v in mod_resp_headers] + + start_response(self._response_status, mod_resp_headers, + self._response_exc_info) + return resp + + def handle_post(self, req, start_response): + """ + Encrypt the new object headers with a new iv and the current crypto. + Note that an object may have encrypted headers while the body may + remain unencrypted. + """ + self._check_headers(req) + keys = self.get_keys(req.environ) + self.encrypt_user_metadata(req, keys) + + resp = self._app_call(req.environ) + start_response(self._response_status, self._response_headers, + self._response_exc_info) + return resp + + @contextmanager + def _mask_conditional_etags(self, req, header_name): + """ + Calculate HMACs of etags in header value and append to existing list. + The HMACs are calculated in the same way as was done for the object + plaintext etag to generate the value of + X-Object-Sysmeta-Crypto-Etag-Mac when the object was PUT. The object + server can therefore use these HMACs to evaluate conditional requests. + HMACs of the etags are appended for the current root secrets and + historic root secrets because it is not known which of them may have + been used to generate the on-disk etag HMAC. + + The existing etag values are left in the list of values to match in + case the object was not encrypted when it was PUT. It is unlikely that + a masked etag value would collide with an unmasked value. 
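        For example (illustrative), an inbound header ``If-Match: "<etag>"``
        is sent on to the object server as
        ``If-Match: "<etag>", "<base64 HMAC-SHA256 of the etag>"`` (one HMAC
        per root secret), and the original header value is restored once the
        request has been handled.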
+ + :param req: an instance of swob.Request + :param header_name: name of header that has etags to mask + :return: True if any etags were masked, False otherwise + """ + masked = False + old_etags = req.headers.get(header_name) + if old_etags: + all_keys = self.get_multiple_keys(req.environ) + new_etags = [] + for etag in Match(old_etags).tags: + if etag == '*': + new_etags.append(etag) + continue + new_etags.append('"%s"' % etag) + for keys in all_keys: + masked_etag = _hmac_etag(keys['object'], etag) + new_etags.append('"%s"' % masked_etag) + masked = True + + req.headers[header_name] = ', '.join(new_etags) + + try: + yield masked + finally: + if old_etags: + req.headers[header_name] = old_etags + + def handle_get_or_head(self, req, start_response): + with self._mask_conditional_etags(req, 'If-Match') as masked1: + with self._mask_conditional_etags(req, 'If-None-Match') as masked2: + if masked1 or masked2: + update_etag_is_at_header( + req, 'X-Object-Sysmeta-Crypto-Etag-Mac') + resp = self._app_call(req.environ) + start_response(self._response_status, self._response_headers, + self._response_exc_info) + return resp + + +class Encrypter(object): + """Middleware for encrypting data and user metadata. + + By default all PUT or POST'ed object data and/or metadata will be + encrypted. Encryption of new data and/or metadata may be disabled by + setting the ``disable_encryption`` option to True. However, this middleware + should remain in the pipeline in order for existing encrypted data to be + read. + """ + + def __init__(self, app, conf): + self.app = app + self.logger = get_logger(conf, log_route="encrypter") + self.crypto = Crypto(conf) + self.disable_encryption = config_true_value( + conf.get('disable_encryption', 'false')) + + def __call__(self, env, start_response): + # If override is set in env, then just pass along + if config_true_value(env.get('swift.crypto.override')): + return self.app(env, start_response) + + req = Request(env) + + if self.disable_encryption and req.method in ('PUT', 'POST'): + return self.app(env, start_response) + try: + req.split_path(4, 4, True) + is_object_request = True + except ValueError: + is_object_request = False + if not is_object_request: + return self.app(env, start_response) + + if req.method in ('GET', 'HEAD'): + handler = EncrypterObjContext(self, self.logger).handle_get_or_head + elif req.method == 'PUT': + handler = EncrypterObjContext(self, self.logger).handle_put + elif req.method == 'POST': + handler = EncrypterObjContext(self, self.logger).handle_post + else: + # anything else + return self.app(env, start_response) + + try: + return handler(req, start_response) + except HTTPException as err_resp: + return err_resp(env, start_response) diff --git a/swift/common/middleware/crypto/keymaster.py b/swift/common/middleware/crypto/keymaster.py new file mode 100644 index 0000000000..cea9fc62ff --- /dev/null +++ b/swift/common/middleware/crypto/keymaster.py @@ -0,0 +1,385 @@ +# Copyright (c) 2015 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. 
+# See the License for the specific language governing permissions and +# limitations under the License. +import hashlib +import hmac + +from swift.common.exceptions import UnknownSecretIdError +from swift.common.middleware.crypto.crypto_utils import CRYPTO_KEY_CALLBACK +from swift.common.swob import Request, HTTPException, wsgi_to_str, str_to_wsgi +from swift.common.utils import readconf, strict_b64decode, get_logger, \ + split_path, load_multikey_opts +from swift.common.wsgi import WSGIContext + + +class KeyMasterContext(WSGIContext): + """ + The simple scheme for key derivation is as follows: every path is + associated with a key, where the key is derived from the path itself in a + deterministic fashion such that the key does not need to be stored. + Specifically, the key for any path is an HMAC of a root key and the path + itself, calculated using an SHA256 hash function:: + + = HMAC_SHA256(, ) + """ + def __init__(self, keymaster, account, container, obj, + meta_version_to_write='2'): + """ + :param keymaster: a Keymaster instance + :param account: account name + :param container: container name + :param obj: object name + """ + super(KeyMasterContext, self).__init__(keymaster.app) + self.keymaster = keymaster + self.account = account + self.container = container + self.obj = obj + self._keys = {} + self.alternate_fetch_keys = None + self.meta_version_to_write = meta_version_to_write + + def _make_key_id(self, path, secret_id, version): + if version in ('1', '2'): + path = str_to_wsgi(path) + key_id = {'v': version, 'path': path} + if secret_id: + # stash secret_id so that decrypter can pass it back to get the + # same keys + key_id['secret_id'] = secret_id + return key_id + + def fetch_crypto_keys(self, key_id=None, *args, **kwargs): + """ + Setup container and object keys based on the request path. + + Keys are derived from request path. The 'id' entry in the results dict + includes the part of the path used to derive keys. Other keymaster + implementations may use a different strategy to generate keys and may + include a different type of 'id', so callers should treat the 'id' as + opaque keymaster-specific data. + + :param key_id: if given this should be a dict with the items included + under the ``id`` key of a dict returned by this method. + :returns: A dict containing encryption keys for 'object' and + 'container', and entries 'id' and 'all_ids'. The 'all_ids' entry is a + list of key id dicts for all root secret ids including the one used + to generate the returned keys. + """ + if key_id: + secret_id = key_id.get('secret_id') + version = key_id['v'] + if version not in ('1', '2', '3'): + raise ValueError('Unknown key_id version: %s' % version) + + if version == '1' and not key_id['path'].startswith( + '/' + self.account + '/'): + # Well shoot. This was the bug that made us notice we needed + # a v2! Hope the current account/container was the original! 
+ key_acct, key_cont, key_obj = ( + self.account, self.container, key_id['path']) + else: + key_acct, key_cont, key_obj = split_path( + key_id['path'], 1, 3, True) + + check_path = ( + self.account, self.container or key_cont, self.obj or key_obj) + if version in ('1', '2') and ( + key_acct, key_cont, key_obj) != check_path: + # Older py3 proxies may have written down crypto meta as WSGI + # strings; we still need to be able to read that + try: + alt_path = tuple( + part.encode('latin1').decode('utf-8') + for part in (key_acct, key_cont, key_obj)) + except UnicodeError: + # Well, it was worth a shot + pass + else: + if check_path == alt_path or ( + check_path[:2] == alt_path[:2] and not self.obj): + # This object is affected by bug #1888037 + key_acct, key_cont, key_obj = alt_path + + if (key_acct, key_cont, key_obj) != check_path: + # Pipeline may have been misconfigured, with copy right of + # encryption. In that case, path in meta may not be the + # request path. + self.keymaster.logger.info( + "Path stored in meta (%r) does not match path from " + "request (%r)! Using path from meta.", + key_id['path'], + '/' + '/'.join(x for x in [ + self.account, self.container, self.obj] if x)) + else: + secret_id = self.keymaster.active_secret_id + # v1 had a bug where we would claim the path was just the object + # name if the object started with a slash. + # v1 and v2 had a bug on py3 where we'd write the path in meta as + # a WSGI string (ie, as Latin-1 chars decoded from UTF-8 bytes). + # Bump versions to establish that we can trust the path. + version = self.meta_version_to_write + key_acct, key_cont, key_obj = ( + self.account, self.container, self.obj) + + if (secret_id, version) in self._keys: + return self._keys[(secret_id, version)] + + keys = {} + account_path = '/' + key_acct + + try: + # self.account/container/obj reflect the level of the *request*, + # which may be different from the level of the key_id-path. Only + # fetch the keys that the request needs. + if self.container: + path = account_path + '/' + key_cont + keys['container'] = self.keymaster.create_key( + path, secret_id=secret_id) + + if self.obj: + if key_obj.startswith('/') and version == '1': + path = key_obj + else: + path = path + '/' + key_obj + keys['object'] = self.keymaster.create_key( + path, secret_id=secret_id) + + # For future-proofing include a keymaster version number and + # the path used to derive keys in the 'id' entry of the + # results. The encrypter will persist this as part of the + # crypto-meta for encrypted data and metadata. If we ever + # change the way keys are generated then the decrypter could + # pass the persisted 'id' value when it calls fetch_crypto_keys + # to inform the keymaster as to how that particular data or + # metadata had its keys generated. Currently we have no need to + # do that, so we are simply persisting this information for + # future use. + keys['id'] = self._make_key_id(path, secret_id, version) + # pass back a list of key id dicts for all other secret ids in + # case the caller is interested, in which case the caller can + # call this method again for different secret ids; this avoided + # changing the return type of the callback or adding another + # callback. Note that the caller should assume no knowledge of + # the content of these key id dicts. 
+ keys['all_ids'] = [self._make_key_id(path, id_, version) + for id_ in self.keymaster.root_secret_ids] + if self.alternate_fetch_keys: + alternate_keys = self.alternate_fetch_keys( + key_id=None, *args, **kwargs) + keys['all_ids'].extend(alternate_keys.get('all_ids', [])) + + self._keys[(secret_id, version)] = keys + + return keys + except UnknownSecretIdError: + if self.alternate_fetch_keys: + return self.alternate_fetch_keys(key_id, *args, **kwargs) + raise + + def handle_request(self, req, start_response): + self.alternate_fetch_keys = req.environ.get(CRYPTO_KEY_CALLBACK) + req.environ[CRYPTO_KEY_CALLBACK] = self.fetch_crypto_keys + resp = self._app_call(req.environ) + start_response(self._response_status, self._response_headers, + self._response_exc_info) + return resp + + +class BaseKeyMaster(object): + """Base middleware for providing encryption keys. + + This provides some basic helpers for: + + - loading from a separate config path, + - deriving keys based on path, and + - installing a ``swift.callback.fetch_crypto_keys`` hook + in the request environment. + + Subclasses should define ``log_route``, ``keymaster_opts``, and + ``keymaster_conf_section`` attributes, and implement the + ``_get_root_secret`` function. + """ + @property + def log_route(self): + raise NotImplementedError + + @property + def keymaster_opts(self): + raise NotImplementedError + + @property + def keymaster_conf_section(self): + raise NotImplementedError + + def _get_root_secret(self, conf): + raise NotImplementedError + + def __init__(self, app, conf): + self.app = app + self.logger = get_logger(conf, log_route=self.log_route) + self.keymaster_config_path = conf.get('keymaster_config_path') + conf = self._load_keymaster_config_file(conf) + + # The _get_root_secret() function is overridden by other keymasters + # which may historically only return a single value + self._root_secrets = self._get_root_secret(conf) + if not isinstance(self._root_secrets, dict): + self._root_secrets = {None: self._root_secrets} + self.active_secret_id = conf.get('active_root_secret_id') or None + if self.active_secret_id not in self._root_secrets: + raise ValueError('No secret loaded for active_root_secret_id %s' % + self.active_secret_id) + for secret_id, secret in self._root_secrets.items(): + if not isinstance(secret, bytes): + raise ValueError('Secret with id %s is %s, not bytes' % ( + secret_id, type(secret))) + + self.meta_version_to_write = conf.get('meta_version_to_write') or '2' + if self.meta_version_to_write not in ('1', '2', '3'): + raise ValueError('Unknown/unsupported metadata version: %r' % + self.meta_version_to_write) + + @property + def root_secret(self): + # Returns the default root secret; this is here for historical reasons + # to support tests and any third party code that might have used it + return self._root_secrets.get(self.active_secret_id) + + @property + def root_secret_ids(self): + # Only sorted to simplify testing + return sorted(self._root_secrets.keys(), key=lambda x: x or '') + + def _load_keymaster_config_file(self, conf): + if not self.keymaster_config_path: + return conf + + # Keymaster options specified in the filter section would be ignored if + # a separate keymaster config file is specified. To avoid confusion, + # prohibit them existing in the filter section. 
+ bad_opts = [] + for opt in conf: + for km_opt in self.keymaster_opts: + if ((km_opt.endswith('*') and opt.startswith(km_opt[:-1])) or + opt == km_opt): + bad_opts.append(opt) + if bad_opts: + raise ValueError('keymaster_config_path is set, but there ' + 'are other config options specified: %s' % + ", ".join(bad_opts)) + return readconf(self.keymaster_config_path, + self.keymaster_conf_section) + + def __call__(self, env, start_response): + req = Request(env) + + try: + parts = [wsgi_to_str(part) for part in req.split_path(2, 4, True)] + except ValueError: + return self.app(env, start_response) + + if req.method in ('PUT', 'POST', 'GET', 'HEAD'): + # handle only those request methods that may require keys + km_context = KeyMasterContext( + self, *parts[1:], + meta_version_to_write=self.meta_version_to_write) + try: + return km_context.handle_request(req, start_response) + except HTTPException as err_resp: + return err_resp(env, start_response) + + # anything else + return self.app(env, start_response) + + def create_key(self, path, secret_id=None): + """ + Creates an encryption key that is unique for the given path. + + :param path: the (WSGI string) path of the resource being encrypted. + :param secret_id: the id of the root secret from which the key should + be derived. + :return: an encryption key. + :raises UnknownSecretIdError: if the secret_id is not recognised. + """ + try: + key = self._root_secrets[secret_id] + except KeyError: + self.logger.warning('Unrecognised secret id: %s' % secret_id) + raise UnknownSecretIdError(secret_id) + else: + path = path.encode('utf-8') + return hmac.new(key, path, digestmod=hashlib.sha256).digest() + + +class KeyMaster(BaseKeyMaster): + """Middleware for providing encryption keys. + + The middleware requires its encryption root secret to be set. This is the + root secret from which encryption keys are derived. This must be set before + first use to a value that is at least 256 bits. The security of all + encrypted data critically depends on this key, therefore it should be set + to a high-entropy value. For example, a suitable value may be obtained by + generating a 32 byte (or longer) value using a cryptographically secure + random number generator. Changing the root secret is likely to result in + data loss. + """ + log_route = 'keymaster' + keymaster_opts = ('encryption_root_secret*', 'active_root_secret_id') + keymaster_conf_section = 'keymaster' + + def _get_root_secret(self, conf): + """ + This keymaster requires ``encryption_root_secret[_id]`` options to be + set. At least one must be set before first use to a value that is a + base64 encoding of at least 32 bytes. The encryption root secrets are + specified in either proxy-server.conf, or in an external file + referenced from proxy-server.conf using ``keymaster_config_path``. 
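Two practical points follow from the code above: ``create_key`` derives each per-path key as HMAC-SHA256 over the resource path keyed with the selected root secret, and a root secret must be a base64 encoding of at least 32 bytes. A hedged sketch of both, using a throwaway secret generated on the spot::

    import base64
    import hashlib
    import hmac
    import os

    # Candidate encryption_root_secret value: 32 random bytes, base64-encoded.
    root_secret_b64 = base64.b64encode(os.urandom(32))
    root_secret = base64.b64decode(root_secret_b64)
    assert len(root_secret) >= 32

    # Equivalent of create_key() for an object-level path:
    path = '/AUTH_test/container/object'.encode('utf-8')
    object_key = hmac.new(root_secret, path,
                          digestmod=hashlib.sha256).digest()
    assert len(object_key) == 32  # SHA-256 digest length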
+ + :param conf: the keymaster config section from proxy-server.conf + :type conf: dict + + :return: a dict mapping secret ids to encryption root secret binary + bytes + :rtype: dict + """ + root_secrets = {} + for opt, secret_id, value in load_multikey_opts( + conf, 'encryption_root_secret', allow_none_key=True): + try: + secret = self._decode_root_secret(value) + except ValueError: + raise ValueError( + '%s option in %s must be a base64 encoding of at ' + 'least 32 raw bytes' % + (opt, self.keymaster_config_path or 'proxy-server.conf')) + root_secrets[secret_id] = secret + return root_secrets + + def _decode_root_secret(self, b64_root_secret): + binary_root_secret = strict_b64decode(b64_root_secret, + allow_line_breaks=True) + if len(binary_root_secret) < 32: + raise ValueError + return binary_root_secret + + +def filter_factory(global_conf, **local_conf): + conf = global_conf.copy() + conf.update(local_conf) + + def keymaster_filter(app): + return KeyMaster(app, conf) + + return keymaster_filter diff --git a/swift/common/middleware/crypto/kmip_keymaster.py b/swift/common/middleware/crypto/kmip_keymaster.py new file mode 100644 index 0000000000..9bc9b79964 --- /dev/null +++ b/swift/common/middleware/crypto/kmip_keymaster.py @@ -0,0 +1,178 @@ +# -*- coding: utf-8 -*- +# Copyright (c) 2018 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. +import logging +import os + +from swift.common.middleware.crypto import keymaster +from swift.common.utils import LogLevelFilter, load_multikey_opts + +from kmip.pie.client import ProxyKmipClient + +""" +This middleware enables Swift to fetch a root secret from a KMIP service. +The root secret is expected to have been previously created in the KMIP service +and is referenced by its unique identifier. The secret should be an AES-256 +symmetric key. + +To use this middleware, edit the swift proxy-server.conf to insert the +middleware in the wsgi pipeline, replacing any other keymaster middleware:: + + [pipeline:main] + pipeline = catch_errors gatekeeper healthcheck proxy-logging \ + kmip_keymaster encryption proxy-logging proxy-server + +and add a new filter section:: + + [filter:kmip_keymaster] + use = egg:swift#kmip_keymaster + key_id = + key_id_ = + active_root_secret_id = + host = + port = + certfile = /path/to/client/cert.pem + keyfile = /path/to/client/key.pem + ca_certs = /path/to/server/cert.pem + username = + password = + +Apart from ``use``, ``key_id*``, ``active_root_secret_id`` the options are +as defined for a PyKMIP client. The authoritative definition of these options +can be found at `https://pykmip.readthedocs.io/en/latest/client.html`_ + +The value of each ``key_id*`` option should be a unique identifier for a secret +to be retrieved from the KMIP service. Any of these secrets may be used for +*decryption*. + +The value of the ``active_root_secret_id`` option should be the ``secret_id`` +for the secret that should be used for all new *encryption*. If not specified, +the ``key_id`` secret will be used. + +.. 
note:: + + To ensure there is no loss of data availability, deploying a new key to + your cluster requires a two-stage config change. First, add the new key + to the ``key_id_`` option and restart the proxy-server. Do this + for all proxies. Next, set the ``active_root_secret_id`` option to the + new secret id and restart the proxy. Again, do this for all proxies. This + process ensures that all proxies will have the new key available for + *decryption* before any proxy uses it for *encryption*. + +The keymaster configuration can alternatively be defined in a separate config +file by using the ``keymaster_config_path`` option:: + + [filter:kmip_keymaster] + use = egg:swift#kmip_keymaster + keymaster_config_path=/etc/swift/kmip_keymaster.conf + +In this case, the ``filter:kmip_keymaster`` section should contain no other +options than ``use`` and ``keymaster_config_path``. All other options should be +defined in the separate config file in a section named ``kmip_keymaster``. For +example:: + + [kmip_keymaster] + key_id = 1234567890 + key_id_foo = 2468024680 + key_id_bar = 1357913579 + active_root_secret_id = foo + host = 127.0.0.1 + port = 5696 + certfile = /etc/swift/kmip_client.crt + keyfile = /etc/swift/kmip_client.key + ca_certs = /etc/swift/kmip_server.crt + username = swift + password = swift_password +""" + + +class KmipKeyMaster(keymaster.BaseKeyMaster): + log_route = 'kmip_keymaster' + keymaster_opts = ('host', 'port', 'certfile', 'keyfile', + 'ca_certs', 'username', 'password', + 'active_root_secret_id', 'key_id*') + keymaster_conf_section = 'kmip_keymaster' + + def _load_keymaster_config_file(self, conf): + conf = super(KmipKeyMaster, self)._load_keymaster_config_file(conf) + if self.keymaster_config_path: + section = self.keymaster_conf_section + else: + # __name__ is just the filter name, not the whole section name. + # Luckily, PasteDeploy only uses the one prefix for filters. + section = 'filter:' + conf['__name__'] + + if os.path.isdir(conf['__file__']): + raise ValueError( + 'KmipKeyMaster config cannot be read from conf dir %s. Use ' + 'keymaster_config_path option in the proxy server config to ' + 'specify a config file.') + + # Make sure we've got the kmip log handler set up before + # we instantiate a client + kmip_logger = logging.getLogger('kmip') + for handler in self.logger.logger.handlers: + kmip_logger.addHandler(handler) + + debug_filter = LogLevelFilter(logging.DEBUG) + for name in ( + # The kmip_protocol logger includes hex-encoded data off the + # wire, which may include key material!! We *NEVER* want that + # enabled. + 'kmip.services.server.kmip_protocol', + # The config_helper logger includes any password that may be + # provided, which doesn't seem great either. 
+ 'kmip.core.config_helper', + ): + logging.getLogger(name).addFilter(debug_filter) + + self.proxy_kmip_client = ProxyKmipClient( + config=section, + config_file=conf['__file__'] + ) + return conf + + def _get_root_secret(self, conf): + multikey_opts = load_multikey_opts(conf, 'key_id', allow_none_key=True) + kmip_to_secret = {} + root_secrets = {} + with self.proxy_kmip_client as client: + for opt, secret_id, kmip_id in multikey_opts: + if kmip_id in kmip_to_secret: + # Save some round trips if there are multiple + # secret_ids for a single kmip_id + root_secrets[secret_id] = root_secrets[ + kmip_to_secret[kmip_id]] + continue + secret = client.get(kmip_id) + algo = secret.cryptographic_algorithm.name + length = secret.cryptographic_length + if (algo, length) != ('AES', 256): + raise ValueError( + 'Expected key %s to be an AES-256 key, not %s-%d' % ( + kmip_id, algo, length)) + root_secrets[secret_id] = secret.value + kmip_to_secret.setdefault(kmip_id, secret_id) + return root_secrets + + +def filter_factory(global_conf, **local_conf): + conf = global_conf.copy() + conf.update(local_conf) + + def keymaster_filter(app): + return KmipKeyMaster(app, conf) + + return keymaster_filter diff --git a/swift/common/middleware/crypto/kms_keymaster.py b/swift/common/middleware/crypto/kms_keymaster.py new file mode 100644 index 0000000000..a44a219d7f --- /dev/null +++ b/swift/common/middleware/crypto/kms_keymaster.py @@ -0,0 +1,122 @@ +# Copyright (c) 2016 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. +from castellan import key_manager, options +from castellan.common.credentials import keystone_password +from oslo_config import cfg +from swift.common.middleware.crypto.keymaster import BaseKeyMaster +from swift.common.utils import load_multikey_opts + + +class KmsKeyMaster(BaseKeyMaster): + """Middleware for retrieving a encryption root secret from an external KMS. + + The middleware accesses the encryption root secret from an external key + management system (KMS), e.g., a Barbican service, using Castellan. To be + able to do so, the appropriate configuration options shall be set in the + proxy-server.conf file, or in the configuration pointed to using the + keymaster_config_path configuration value in the proxy-server.conf file. + """ + log_route = 'kms_keymaster' + keymaster_opts = ('username', 'password', 'project_name', + 'user_domain_name', 'project_domain_name', + 'user_id', 'user_domain_id', 'trust_id', + 'domain_id', 'domain_name', 'project_id', + 'project_domain_id', 'reauthenticate', + 'auth_endpoint', 'api_class', 'key_id*', + 'barbican_endpoint', 'barbican_region_name', + 'active_root_secret_id') + keymaster_conf_section = 'kms_keymaster' + + def _get_root_secret(self, conf): + """ + Retrieve the root encryption secret from an external key management + system using Castellan. 
+ + :param conf: the keymaster config section from proxy-server.conf + :type conf: dict + + :return: the encryption root secret binary bytes + :rtype: bytearray + """ + ctxt = keystone_password.KeystonePassword( + auth_url=conf.get('auth_endpoint'), + username=conf.get('username'), + password=conf.get('password'), + project_name=conf.get('project_name'), + user_domain_name=conf.get('user_domain_name'), + project_domain_name=conf.get( + 'project_domain_name'), + user_id=conf.get('user_id'), + user_domain_id=conf.get('user_domain_id'), + trust_id=conf.get('trust_id'), + domain_id=conf.get('domain_id'), + domain_name=conf.get('domain_name'), + project_id=conf.get('project_id'), + project_domain_id=conf.get('project_domain_id'), + reauthenticate=conf.get('reauthenticate')) + oslo_conf = cfg.ConfigOpts() + options.set_defaults( + oslo_conf, auth_endpoint=conf.get('auth_endpoint'), + barbican_endpoint=conf.get('barbican_endpoint'), + api_class=conf.get('api_class') + ) + # Set barbican_region_name if provided in config + # This is used by Castellan's BarbicanKeyManager for endpoint discovery + if conf.get('barbican_region_name'): + oslo_conf.set_default('barbican_region_name', + conf.get('barbican_region_name'), + group='barbican') + options.enable_logging() + manager = key_manager.API(oslo_conf) + + root_secrets = {} + for opt, secret_id, key_id in load_multikey_opts( + conf, 'key_id', allow_none_key=True): + key = manager.get(ctxt, key_id) + if key is None: + raise ValueError("Retrieval of encryption root secret with " + "key_id '%s' returned None." + % (key_id, )) + try: + if (key.bit_length < 256) or (key.algorithm.lower() != "aes"): + raise ValueError('encryption root secret stored in the ' + 'external KMS must be an AES key of at ' + 'least 256 bits (provided key ' + 'length: %d, provided key algorithm: %s)' + % (key.bit_length, key.algorithm)) + if (key.format != 'RAW'): + raise ValueError('encryption root secret stored in the ' + 'external KMS must be in RAW format and ' + 'not e.g., as a base64 encoded string ' + '(format of key with uuid %s: %s)' % + (key_id, key.format)) + except Exception: + raise ValueError("Secret with key_id '%s' is not a symmetric " + "key (type: %s)" % (key_id, str(type(key)))) + secret = key.get_encoded() + if not isinstance(secret, bytes): + secret = secret.encode('utf-8') + root_secrets[secret_id] = secret + return root_secrets + + +def filter_factory(global_conf, **local_conf): + conf = global_conf.copy() + conf.update(local_conf) + + def kms_keymaster_filter(app): + return KmsKeyMaster(app, conf) + + return kms_keymaster_filter diff --git a/swift/common/middleware/dlo.py b/swift/common/middleware/dlo.py new file mode 100644 index 0000000000..1b41ac9091 --- /dev/null +++ b/swift/common/middleware/dlo.py @@ -0,0 +1,470 @@ +# Copyright (c) 2013 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +""" +Middleware that will provide Dynamic Large Object (DLO) support. 
+ +--------------- +Using ``swift`` +--------------- + +The quickest way to try out this feature is use the ``swift`` Swift Tool +included with the `python-swiftclient`_ library. You can use the ``-S`` +option to specify the segment size to use when splitting a large file. For +example:: + + swift upload test_container -S 1073741824 large_file + +This would split the large_file into 1G segments and begin uploading those +segments in parallel. Once all the segments have been uploaded, ``swift`` will +then create the manifest file so the segments can be downloaded as one. + +So now, the following ``swift`` command would download the entire large +object:: + + swift download test_container large_file + +``swift`` command uses a strict convention for its segmented object +support. In the above example it will upload all the segments into a +second container named test_container_segments. These segments will +have names like large_file/1290206778.25/21474836480/00000000, +large_file/1290206778.25/21474836480/00000001, etc. + +The main benefit for using a separate container is that the main container +listings will not be polluted with all the segment names. The reason for using +the segment name format of /// is so that an +upload of a new file with the same name won't overwrite the contents of the +first until the last moment when the manifest file is updated. + +``swift`` will manage these segment files for you, deleting old segments on +deletes and overwrites, etc. You can override this behavior with the +``--leave-segments`` option if desired; this is useful if you want to have +multiple versions of the same large object available. + +.. _`python-swiftclient`: http://github.com/openstack/python-swiftclient + +---------- +Direct API +---------- + +You can also work with the segments and manifests directly with HTTP +requests instead of having ``swift`` do that for you. You can just +upload the segments like you would any other object and the manifest +is just a zero-byte (not enforced) file with an extra +``X-Object-Manifest`` header. + +All the object segments need to be in the same container, have a common object +name prefix, and sort in the order in which they should be concatenated. +Object names are sorted lexicographically as UTF-8 byte strings. +They don't have to be in the same container as the manifest file will be, which +is useful to keep container listings clean as explained above with ``swift``. + +The manifest file is simply a zero-byte (not enforced) file with the extra +``X-Object-Manifest: /`` header, where ```` is +the container the object segments are in and ```` is the common prefix +for all the segments. + +It is best to upload all the segments first and then create or update the +manifest. In this way, the full object won't be available for downloading +until the upload is complete. Also, you can upload a new set of segments to +a second location and then update the manifest to point to this new location. +During the upload of the new segments, the original manifest will still be +available to download the first set of segments. + +.. note:: + + When updating a manifest object using a POST request, a + ``X-Object-Manifest`` header must be included for the object to + continue to behave as a manifest object. + + The manifest file should have no content. However, this is not enforced. 
+ If the manifest path itself conforms to container/prefix specified in + ``X-Object-Manifest``, and if manifest has some content/data in it, it + would also be considered as segment and manifest's content will be part of + the concatenated GET response. The order of concatenation follows the usual + DLO logic which is - the order of concatenation adheres to order returned + when segment names are sorted. + + +Here's an example using ``curl`` with tiny 1-byte segments:: + + # First, upload the segments + curl -X PUT -H 'X-Auth-Token: ' \ + http:///container/myobject/00000001 --data-binary '1' + curl -X PUT -H 'X-Auth-Token: ' \ + http:///container/myobject/00000002 --data-binary '2' + curl -X PUT -H 'X-Auth-Token: ' \ + http:///container/myobject/00000003 --data-binary '3' + + # Next, create the manifest file + curl -X PUT -H 'X-Auth-Token: ' \ + -H 'X-Object-Manifest: container/myobject/' \ + http:///container/myobject --data-binary '' + + # And now we can download the segments as a single object + curl -H 'X-Auth-Token: ' \ + http:///container/myobject +""" + +import json + +from swift.common import constraints +from swift.common.exceptions import ListingIterError, SegmentError +from swift.common.http import is_success +from swift.common.swob import Request, Response, HTTPException, \ + HTTPRequestedRangeNotSatisfiable, HTTPBadRequest, HTTPConflict, \ + str_to_wsgi, wsgi_to_str, wsgi_quote, wsgi_unquote, normalize_etag +from swift.common.utils import get_logger, \ + RateLimitedIterator, quote, close_if_possible, closing_if_possible, \ + drain_and_close, md5 +from swift.common.request_helpers import SegmentedIterable, \ + update_ignore_range_header +from swift.common.wsgi import WSGIContext, make_subrequest, load_app_config + + +class GetContext(WSGIContext): + def __init__(self, dlo, logger): + super(GetContext, self).__init__(dlo.app) + self.dlo = dlo + self.logger = logger + + def _get_container_listing(self, req, version, account, container, + prefix, marker=''): + ''' + :param version: whatever + :param account: native + :param container: native + :param prefix: native + :param marker: native + ''' + con_req = make_subrequest( + req.environ, + path=wsgi_quote('/'.join([ + '', str_to_wsgi(version), + str_to_wsgi(account), str_to_wsgi(container)])), + method='GET', + headers={'x-auth-token': req.headers.get('x-auth-token')}, + agent=('%(orig)s ' + 'DLO MultipartGET'), swift_source='DLO') + con_req.query_string = 'prefix=%s' % quote(prefix) + if marker: + con_req.query_string += '&marker=%s' % quote(marker) + + con_resp = con_req.get_response(self.dlo.app) + if not is_success(con_resp.status_int): + if req.method == 'HEAD': + con_resp.body = b'' + return con_resp, None + with closing_if_possible(con_resp.app_iter): + return None, json.loads(b''.join(con_resp.app_iter)) + + def _segment_listing_iterator(self, req, version, account, container, + prefix, segments, first_byte=None, + last_byte=None): + ''' + :param req: upstream request + :param version: native + :param account: native + :param container: native + :param prefix: native + :param segments: array of dicts, with native strings + :param first_byte: number + :param last_byte: number + ''' + # It's sort of hokey that this thing takes in the first page of + # segments as an argument, but we need to compute the etag and content + # length from the first page, and it's better to have a hokey + # interface than to make redundant requests. 
+ if first_byte is None: + first_byte = 0 + if last_byte is None: + last_byte = float("inf") + + while True: + for segment in segments: + seg_length = int(segment['bytes']) + + if first_byte >= seg_length: + # don't need any bytes from this segment + first_byte = max(first_byte - seg_length, -1) + last_byte = max(last_byte - seg_length, -1) + continue + elif last_byte < 0: + # no bytes are needed from this or any future segment + break + + seg_name = segment['name'] + + # We deliberately omit the etag and size here; + # SegmentedIterable will check size and etag if + # specified, but we don't want it to. DLOs only care + # that the objects' names match the specified prefix. + # SegmentedIterable will instead check that the data read + # from each segment matches the response headers. + _path = "/".join(["", version, account, container, seg_name]) + _first = None if first_byte <= 0 else first_byte + _last = None if last_byte >= seg_length - 1 else last_byte + yield { + 'path': _path, + 'first_byte': _first, + 'last_byte': _last + } + + first_byte = max(first_byte - seg_length, -1) + last_byte = max(last_byte - seg_length, -1) + + if len(segments) < constraints.CONTAINER_LISTING_LIMIT: + # a short page means that we're done with the listing + break + elif last_byte < 0: + break + + marker = segments[-1]['name'] + error_response, segments = self._get_container_listing( + req, version, account, container, prefix, marker) + if error_response: + # we've already started sending the response body to the + # client, so all we can do is raise an exception to make the + # WSGI server close the connection early + close_if_possible(error_response.app_iter) + raise ListingIterError( + "Got status %d listing container /%s/%s" % + (error_response.status_int, account, container)) + + def get_or_head_response(self, req, x_object_manifest): + ''' + :param req: user's request + :param x_object_manifest: as unquoted, native string + ''' + response_headers = self._response_headers + + container, obj_prefix = x_object_manifest.split('/', 1) + + version, account, _junk = req.split_path(2, 3, True) + version = wsgi_to_str(version) + account = wsgi_to_str(account) + error_response, segments = self._get_container_listing( + req, version, account, container, obj_prefix) + if error_response: + return error_response + have_complete_listing = len(segments) < \ + constraints.CONTAINER_LISTING_LIMIT + + first_byte = last_byte = None + actual_content_length = None + content_length_for_swob_range = None + if req.range and len(req.range.ranges) == 1: + content_length_for_swob_range = sum(o['bytes'] for o in segments) + + # This is a hack to handle suffix byte ranges (e.g. "bytes=-5"), + # which we can't honor unless we have a complete listing. + _junk, range_end = req.range.ranges_for_length(float("inf"))[0] + + # If this is all the segments, we know whether or not this + # range request is satisfiable. + # + # Alternately, we may not have all the segments, but this range + # falls entirely within the first page's segments, so we know + # that it is satisfiable. 
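The per-segment range arithmetic above is easier to follow with concrete numbers. Below is a standalone sketch of the same walk over an in-memory listing (no paging), assuming three 5-byte segments and a request for bytes 7-11::

    def walk(segments, first_byte, last_byte):
        # Mirrors the offset bookkeeping in _segment_listing_iterator.
        for seg in segments:
            seg_length = seg['bytes']
            if first_byte >= seg_length:
                # no bytes needed from this segment
                first_byte = max(first_byte - seg_length, -1)
                last_byte = max(last_byte - seg_length, -1)
                continue
            if last_byte < 0:
                break  # nothing needed from this or later segments
            yield (seg['name'],
                   None if first_byte <= 0 else first_byte,
                   None if last_byte >= seg_length - 1 else last_byte)
            first_byte = max(first_byte - seg_length, -1)
            last_byte = max(last_byte - seg_length, -1)

    segs = [{'name': 's1', 'bytes': 5},
            {'name': 's2', 'bytes': 5},
            {'name': 's3', 'bytes': 5}]
    print(list(walk(segs, 7, 11)))
    # -> [('s2', 2, None), ('s3', None, 1)]

That is, byte 7 of the concatenated object is offset 2 of the second segment, and byte 11 is offset 1 of the third.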
+ if (have_complete_listing + or range_end < content_length_for_swob_range): + byteranges = req.range.ranges_for_length( + content_length_for_swob_range) + if not byteranges: + headers = {'Accept-Ranges': 'bytes'} + if have_complete_listing: + headers['Content-Range'] = 'bytes */%d' % ( + content_length_for_swob_range, ) + return HTTPRequestedRangeNotSatisfiable( + request=req, headers=headers) + first_byte, last_byte = byteranges[0] + # For some reason, swob.Range.ranges_for_length adds 1 to the + # last byte's position. + last_byte -= 1 + actual_content_length = last_byte - first_byte + 1 + else: + # The range may or may not be satisfiable, but we can't tell + # based on just one page of listing, and we're not going to go + # get more pages because that would use up too many resources, + # so we ignore the Range header and return the whole object. + actual_content_length = None + content_length_for_swob_range = None + req.range = None + else: + req.range = None + + response_headers = [ + (h, v) for h, v in response_headers + if h.lower() not in ("content-length", "content-range")] + + if content_length_for_swob_range is not None: + # Here, we have to give swob a big-enough content length so that + # it can compute the actual content length based on the Range + # header. This value will not be visible to the client; swob will + # substitute its own Content-Length. + # + # Note: if the manifest points to at least CONTAINER_LISTING_LIMIT + # segments, this may be less than the sum of all the segments' + # sizes. However, it'll still be greater than the last byte in the + # Range header, so it's good enough for swob. + response_headers.append(('Content-Length', + str(content_length_for_swob_range))) + elif have_complete_listing: + actual_content_length = sum(o['bytes'] for o in segments) + response_headers.append(('Content-Length', + str(actual_content_length))) + + if have_complete_listing: + response_headers = [(h, v) for h, v in response_headers + if h.lower() != "etag"] + etag = md5(usedforsecurity=False) + for seg_dict in segments: + etag.update(normalize_etag(seg_dict['hash']).encode('utf8')) + response_headers.append(('Etag', '"%s"' % etag.hexdigest())) + + app_iter = None + if req.method == 'GET': + listing_iter = RateLimitedIterator( + self._segment_listing_iterator( + req, version, account, container, obj_prefix, segments, + first_byte=first_byte, last_byte=last_byte), + self.dlo.rate_limit_segments_per_sec, + limit_after=self.dlo.rate_limit_after_segment) + + app_iter = SegmentedIterable( + req, self.dlo.app, listing_iter, ua_suffix="DLO MultipartGET", + swift_source="DLO", name=req.path, logger=self.logger, + max_get_time=self.dlo.max_get_time, + response_body_length=actual_content_length) + + try: + app_iter.validate_first_segment() + except HTTPException as err_resp: + return err_resp + except (SegmentError, ListingIterError): + return HTTPConflict(request=req) + + resp = Response(request=req, headers=response_headers, + conditional_response=True, + app_iter=app_iter) + + return resp + + def handle_request(self, req, start_response): + """ + Take a GET or HEAD request, and if it is for a dynamic large object + manifest, return an appropriate response. + + Otherwise, simply pass it through. 
+ """ + update_ignore_range_header(req, 'X-Object-Manifest') + resp_iter = self._app_call(req.environ) + + # make sure this response is for a dynamic large object manifest + for header, value in self._response_headers: + if (header.lower() == 'x-object-manifest'): + content_length = self._response_header_value('content-length') + if content_length is not None and int(content_length) < 1024: + # Go ahead and consume small bodies + drain_and_close(resp_iter) + close_if_possible(resp_iter) + response = self.get_or_head_response( + req, wsgi_to_str(wsgi_unquote(value))) + return response(req.environ, start_response) + # Not a dynamic large object manifest; just pass it through. + start_response(self._response_status, + self._response_headers, + self._response_exc_info) + return resp_iter + + +class DynamicLargeObject(object): + def __init__(self, app, conf): + self.app = app + self.logger = get_logger(conf, log_route='dlo') + + # DLO functionality used to live in the proxy server, not middleware, + # so let's try to go find config values in the proxy's config section + # to ease cluster upgrades. + self._populate_config_from_old_location(conf) + + self.max_get_time = int(conf.get('max_get_time', '86400')) + self.rate_limit_after_segment = int(conf.get( + 'rate_limit_after_segment', '10')) + self.rate_limit_segments_per_sec = int(conf.get( + 'rate_limit_segments_per_sec', '1')) + + def _populate_config_from_old_location(self, conf): + if ('rate_limit_after_segment' in conf or + 'rate_limit_segments_per_sec' in conf or + 'max_get_time' in conf or + '__file__' not in conf): + return + + proxy_conf = load_app_config(conf['__file__']) + for setting in ('rate_limit_after_segment', + 'rate_limit_segments_per_sec', + 'max_get_time'): + if setting in proxy_conf: + conf[setting] = proxy_conf[setting] + + def __call__(self, env, start_response): + """ + WSGI entry point + """ + req = Request(env) + try: + vrs, account, container, obj = req.split_path(4, 4, True) + is_obj_req = True + except ValueError: + is_obj_req = False + if not is_obj_req: + return self.app(env, start_response) + + if ((req.method == 'GET' or req.method == 'HEAD') and + req.params.get('multipart-manifest') != 'get'): + return GetContext(self, self.logger).\ + handle_request(req, start_response) + elif req.method == 'PUT': + error_response = self._validate_x_object_manifest_header(req) + if error_response: + return error_response(env, start_response) + return self.app(env, start_response) + + def _validate_x_object_manifest_header(self, req): + """ + Make sure that X-Object-Manifest is valid if present. + """ + if 'X-Object-Manifest' in req.headers: + value = req.headers['X-Object-Manifest'] + container = prefix = None + try: + container, prefix = value.split('/', 1) + except ValueError: + pass + if not container or not prefix or '?' in value or '&' in value or \ + prefix.startswith('/'): + return HTTPBadRequest( + request=req, + body=('X-Object-Manifest must be in the ' + 'format container/prefix')) + + +def filter_factory(global_conf, **local_conf): + conf = global_conf.copy() + conf.update(local_conf) + + def dlo_filter(app): + return DynamicLargeObject(app, conf) + return dlo_filter diff --git a/swift/common/middleware/domain_remap.py b/swift/common/middleware/domain_remap.py index 025ae4b050..aec8e90e93 100644 --- a/swift/common/middleware/domain_remap.py +++ b/swift/common/middleware/domain_remap.py @@ -1,4 +1,4 @@ -# Copyright (c) 2010-2012 OpenStack, LLC. 
+# Copyright (c) 2010-2012 OpenStack Foundation # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. @@ -17,39 +17,95 @@ """ Domain Remap Middleware -Middleware that translates container and account parts of a domain to -path parameters that the proxy server understands. +Middleware that translates container and account parts of a domain to path +parameters that the proxy server understands. -container.account.storageurl/object gets translated to -container.account.storageurl/path_root/account/container/object +Translation is only performed when the request URL's host domain matches one of +a list of domains. This list may be configured by the option +``storage_domain``, and defaults to the single domain ``example.com``. -account.storageurl/path_root/container/object gets translated to -account.storageurl/path_root/account/container/object +If not already present, a configurable ``path_root``, which defaults to ``v1``, +will be added to the start of the translated path. -Browsers can convert a host header to lowercase, so check that reseller -prefix on the account is the correct case. This is done by comparing the -items in the reseller_prefixes config option to the found prefix. If they -match except for case, the item from reseller_prefixes will be used -instead of the found reseller prefix. The reseller_prefixes list is -exclusive. If defined, any request with an account prefix not in that list -will be ignored by this middleware. reseller_prefixes defaults to 'AUTH'. +For example, with the default configuration:: + + container.AUTH-account.example.com/object + container.AUTH-account.example.com/v1/object + +would both be translated to:: + + container.AUTH-account.example.com/v1/AUTH_account/container/object + +and:: + + AUTH-account.example.com/container/object + AUTH-account.example.com/v1/container/object + +would both be translated to:: + + AUTH-account.example.com/v1/AUTH_account/container/object + +Additionally, translation is only performed when the account name in the +translated path starts with a reseller prefix matching one of a list configured +by the option ``reseller_prefixes``, or when no match is found but a +``default_reseller_prefix`` has been configured. + +The ``reseller_prefixes`` list defaults to the single prefix ``AUTH``. The +``default_reseller_prefix`` is not configured by default. + +Browsers can convert a host header to lowercase, so the middleware checks that +the reseller prefix on the account name is the correct case. This is done by +comparing the items in the ``reseller_prefixes`` config option to the found +prefix. If they match except for case, the item from ``reseller_prefixes`` will +be used instead of the found reseller prefix. The middleware will also replace +any hyphen ('-') in the account name with an underscore ('_'). + +For example, with the default configuration:: + + auth-account.example.com/container/object + AUTH-account.example.com/container/object + auth_account.example.com/container/object + AUTH_account.example.com/container/object + +would all be translated to:: + + .example.com/v1/AUTH_account/container/object + +When no match is found in ``reseller_prefixes``, the +``default_reseller_prefix`` config option is used. When no +``default_reseller_prefix`` is configured, any request with an account prefix +not in the ``reseller_prefixes`` list will be ignored by this middleware. 
+ +For example, with ``default_reseller_prefix = AUTH``:: + + account.example.com/container/object + +would be translated to:: + + account.example.com/v1/AUTH_account/container/object Note that this middleware requires that container names and account names -(except as described above) must be DNS-compatible. This means that the -account name created in the system and the containers created by users -cannot exceed 63 characters or have UTF-8 characters. These are -restrictions over and above what swift requires and are not explicitly -checked. Simply put, the this middleware will do a best-effort attempt to -derive account and container names from elements in the domain name and -put those derived values into the URL path (leaving the Host header -unchanged). - -Also note that using container sync with remapped domain names is not -advised. With container sync, you should use the true storage end points as -sync destinations. +(except as described above) must be DNS-compatible. This means that the account +name created in the system and the containers created by users cannot exceed 63 +characters or have UTF-8 characters. These are restrictions over and above what +Swift requires and are not explicitly checked. Simply put, this middleware +will do a best-effort attempt to derive account and container names from +elements in the domain name and put those derived values into the URL path +(leaving the ``Host`` header unchanged). + +Also note that using :doc:`overview_container_sync` with remapped domain names +is not advised. With :doc:`overview_container_sync`, you should use the true +storage end points as sync destinations. """ -from swift.common.swob import Request, HTTPBadRequest +from swift.common.middleware import RewriteContext +from swift.common.swob import Request, HTTPBadRequest, wsgi_quote +from swift.common.utils import config_true_value, list_from_csv +from swift.common.registry import register_swift_info + + +class _DomainRemapContext(RewriteContext): + base_re = r'^(https?://[^/]+)%s(.*)$' class DomainRemapMiddleware(object): @@ -65,25 +121,35 @@ class DomainRemapMiddleware(object): def __init__(self, app, conf): self.app = app - self.storage_domain = conf.get('storage_domain', 'example.com') - if self.storage_domain and self.storage_domain[0] != '.': - self.storage_domain = '.' + self.storage_domain - self.path_root = conf.get('path_root', 'v1').strip('/') + storage_domain = conf.get('storage_domain', 'example.com') + self.storage_domain = ['.' 
+ s for s in + list_from_csv(storage_domain) + if not s.startswith('.')] + self.storage_domain += [s for s in list_from_csv(storage_domain) + if s.startswith('.')] + self.path_root = conf.get('path_root', 'v1').strip('/') + '/' prefixes = conf.get('reseller_prefixes', 'AUTH') - self.reseller_prefixes = [x.strip() for x in prefixes.split(',') - if x.strip()] + self.reseller_prefixes = list_from_csv(prefixes) self.reseller_prefixes_lower = [x.lower() for x in self.reseller_prefixes] + self.default_reseller_prefix = conf.get('default_reseller_prefix') + self.mangle_client_paths = config_true_value( + conf.get('mangle_client_paths')) def __call__(self, env, start_response): if not self.storage_domain: return self.app(env, start_response) - given_domain = env['HTTP_HOST'] + if 'HTTP_HOST' in env: + given_domain = env['HTTP_HOST'] + else: + given_domain = env['SERVER_NAME'] port = '' if ':' in given_domain: given_domain, port = given_domain.rsplit(':', 1) - if given_domain.endswith(self.storage_domain): - parts_to_parse = given_domain[:-len(self.storage_domain)] + storage_domain = next((domain for domain in self.storage_domain + if given_domain.endswith(domain)), None) + if storage_domain: + parts_to_parse = given_domain[:-len(storage_domain)] parts_to_parse = parts_to_parse.strip('.').split('.') len_parts_to_parse = len(parts_to_parse) if len_parts_to_parse == 2: @@ -92,31 +158,44 @@ def __call__(self, env, start_response): container, account = None, parts_to_parse[0] else: resp = HTTPBadRequest(request=Request(env), - body='Bad domain in host header', + body=b'Bad domain in host header', content_type='text/plain') return resp(env, start_response) - if '_' not in account and '-' in account: - account = account.replace('-', '_', 1) - account_reseller_prefix = account.split('_', 1)[0].lower() - if account_reseller_prefix not in self.reseller_prefixes_lower: - # account prefix is not in config list. bail. - return self.app(env, start_response) - prefix_index = self.reseller_prefixes_lower.index( - account_reseller_prefix) - real_prefix = self.reseller_prefixes[prefix_index] - if not account.startswith(real_prefix): - account_suffix = account[len(real_prefix):] - account = real_prefix + account_suffix - path = env['PATH_INFO'].strip('/') - new_path_parts = ['', self.path_root, account] + if len(self.reseller_prefixes) > 0: + if '_' not in account and '-' in account: + account = account.replace('-', '_', 1) + account_reseller_prefix = account.split('_', 1)[0].lower() + + if account_reseller_prefix in self.reseller_prefixes_lower: + prefix_index = self.reseller_prefixes_lower.index( + account_reseller_prefix) + real_prefix = self.reseller_prefixes[prefix_index] + if not account.startswith(real_prefix): + account_suffix = account[len(real_prefix):] + account = real_prefix + account_suffix + elif self.default_reseller_prefix: + # account prefix is not in config list. Add default one. + account = "%s_%s" % (self.default_reseller_prefix, account) + else: + # account prefix is not in config list. bail. 
+ return self.app(env, start_response) + + requested_path = env['PATH_INFO'] + path = requested_path[1:] + new_path_parts = ['', self.path_root[:-1], account] if container: new_path_parts.append(container) - if path.startswith(self.path_root): - path = path[len(self.path_root):].lstrip('/') - if path: - new_path_parts.append(path) + if self.mangle_client_paths and (path + '/').startswith( + self.path_root): + path = path[len(self.path_root):] + new_path_parts.append(path) new_path = '/'.join(new_path_parts) env['PATH_INFO'] = new_path + + context = _DomainRemapContext( + self.app, wsgi_quote(requested_path), wsgi_quote(new_path)) + return context.handle_request(env, start_response) + return self.app(env, start_response) @@ -124,6 +203,10 @@ def filter_factory(global_conf, **local_conf): conf = global_conf.copy() conf.update(local_conf) + register_swift_info( + 'domain_remap', + default_reseller_prefix=conf.get('default_reseller_prefix')) + def domain_filter(app): return DomainRemapMiddleware(app, conf) return domain_filter diff --git a/swift/common/middleware/etag_quoter.py b/swift/common/middleware/etag_quoter.py new file mode 100644 index 0000000000..d67c1b48b7 --- /dev/null +++ b/swift/common/middleware/etag_quoter.py @@ -0,0 +1,128 @@ +# Copyright (c) 2010-2020 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +""" +This middleware fix the Etag header of responses so that it is RFC compliant. +`RFC 7232 `__ specifies that +the value of the Etag header must be double quoted. + +It must be placed at the beggining of the pipeline, right after cache:: + + [pipeline:main] + pipeline = ... cache etag-quoter ... + + [filter:etag-quoter] + use = egg:swift#etag_quoter + +Set ``X-Account-Rfc-Compliant-Etags: true`` at the account +level to have any Etags in object responses be double quoted, as in +``"d41d8cd98f00b204e9800998ecf8427e"``. Alternatively, you may +only fix Etags in a single container by setting +``X-Container-Rfc-Compliant-Etags: true`` on the container. +This may be necessary for Swift to work properly with some CDNs. + +Either option may also be explicitly *disabled*, so you may enable quoted +Etags account-wide as above but turn them off for individual containers +with ``X-Container-Rfc-Compliant-Etags: false``. This may be +useful if some subset of applications expect Etags to be bare MD5s. 
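The quoting rule the filter applies is small enough to show on its own: an Etag that already looks like a (possibly weak) quoted entity-tag passes through, anything else gets wrapped in double quotes. A sketch of that transform, mirroring the header rewrite further down in this file::

    def quote_etag(value):
        # Already RFC 7232 style: "..." or W/"..."
        if value.startswith(('"', 'W/"')) and value.endswith('"'):
            return value
        return '"%s"' % value

    assert quote_etag('d41d8cd98f00b204e9800998ecf8427e') == \
        '"d41d8cd98f00b204e9800998ecf8427e"'
    assert quote_etag('"already-quoted"') == '"already-quoted"'
    assert quote_etag('W/"weak"') == 'W/"weak"'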
+""" + +from swift.common.constraints import valid_api_version +from swift.common.http import is_success +from swift.common.swob import Request +from swift.common.utils import config_true_value +from swift.common.registry import register_swift_info +from swift.proxy.controllers.base import get_account_info, get_container_info + + +class EtagQuoterMiddleware(object): + def __init__(self, app, conf): + self.app = app + self.conf = conf + + def __call__(self, env, start_response): + req = Request(env) + try: + version, account, container, obj = req.split_path( + 2, 4, rest_with_last=True) + is_swifty_request = valid_api_version(version) + except ValueError: + is_swifty_request = False + + if not is_swifty_request: + return self.app(env, start_response) + + if not obj: + typ = 'Container' if container else 'Account' + client_header = 'X-%s-Rfc-Compliant-Etags' % typ + sysmeta_header = 'X-%s-Sysmeta-Rfc-Compliant-Etags' % typ + if client_header in req.headers: + if req.headers[client_header]: + req.headers[sysmeta_header] = config_true_value( + req.headers[client_header]) + else: + req.headers[sysmeta_header] = '' + if req.headers.get(client_header.replace('X-', 'X-Remove-', 1)): + req.headers[sysmeta_header] = '' + + def translating_start_response(status, headers, exc_info=None): + return start_response(status, [ + (client_header if h.title() == sysmeta_header else h, + v) for h, v in headers + ], exc_info) + + return self.app(env, translating_start_response) + + container_info = get_container_info(env, self.app, 'EQ') + if not container_info or not is_success(container_info['status']): + return self.app(env, start_response) + + flag = container_info.get('sysmeta', {}).get('rfc-compliant-etags') + if flag is None: + account_info = get_account_info(env, self.app, 'EQ') + if not account_info or not is_success(account_info['status']): + return self.app(env, start_response) + + flag = account_info.get('sysmeta', {}).get( + 'rfc-compliant-etags') + + if flag is None: + flag = self.conf.get('enable_by_default', 'false') + + if not config_true_value(flag): + return self.app(env, start_response) + + status, headers, resp_iter = req.call_application(self.app) + + headers = [ + (header, value) if header.lower() != 'etag' or ( + value.startswith(('"', 'W/"')) and value.endswith('"')) + else (header, '"%s"' % value) + for header, value in headers] + + start_response(status, headers) + return resp_iter + + +def filter_factory(global_conf, **local_conf): + conf = global_conf.copy() + conf.update(local_conf) + register_swift_info( + 'etag_quoter', enable_by_default=config_true_value( + conf.get('enable_by_default', 'false'))) + + def etag_quoter_filter(app): + return EtagQuoterMiddleware(app, conf) + return etag_quoter_filter diff --git a/swift/common/middleware/formpost.py b/swift/common/middleware/formpost.py index 9dee49c902..9c75bc79b2 100644 --- a/swift/common/middleware/formpost.py +++ b/swift/common/middleware/formpost.py @@ -1,4 +1,4 @@ -# Copyright (c) 2011 OpenStack, LLC. +# Copyright (c) 2011 OpenStack Foundation # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. @@ -13,7 +13,7 @@ # See the License for the specific language governing permissions and # limitations under the License. -""" +r""" FormPost Middleware Translates a browser form post into a regular Swift object PUT. 
@@ -31,7 +31,24 @@ -The is the URL to the Swift desination, such as:: +Optionally, if you want the uploaded files to be temporary you can set +x-delete-at or x-delete-after attributes by adding one of these as a +form input:: + + + + +If you want to specify the content type or content encoding of the files you +can set content-encoding or content-type by adding them to the form input:: + + + + +The above example applies these parameters to all uploaded files. You can also +set the content-type and content-encoding on a per-file basis by adding the +parameters to each part of the upload. + +The is the URL of the Swift destination, such as:: https://swift-cluster.example.com/v1/AUTH_account/container/object_prefix @@ -49,11 +66,12 @@ Note the form method must be POST and the enctype must be set as "multipart/form-data". -The redirect attribute is the URL to redirect the browser to after -the upload completes. The URL will have status and message query -parameters added to it, indicating the HTTP status code for the -upload (2xx is success) and a possible message for further -information if there was an error (such as "max_file_size exceeded"). +The redirect attribute is the URL to redirect the browser to after the upload +completes. This is an optional parameter. If you are uploading the form via an +XMLHttpRequest the redirect should not be included. The URL will have status +and message query parameters added to it, indicating the HTTP status code for +the upload (2xx is success) and a possible message for further information if +there was an error (such as "max_file_size exceeded"). The max_file_size attribute must be included and indicates the largest single file upload that can be done, in bytes. @@ -66,26 +84,29 @@ The expires attribute is the Unix timestamp before which the form must be submitted before it is invalidated. -The signature attribute is the HMAC-SHA1 signature of the form. Here is +The signature attribute is the HMAC signature of the form. Here is sample code for computing the signature:: import hmac - from hashlib import sha1 + from hashlib import sha512 from time import time path = '/v1/account/container/object_prefix' - redirect = 'https://myserver.com/some-page' + redirect = 'https://srv.com/some-page' # set to '' if redirect not in form max_file_size = 104857600 max_file_count = 10 expires = int(time() + 600) key = 'mykey' - hmac_body = '%s\\n%s\\n%s\\n%s\\n%s' % (path, redirect, + hmac_body = '%s\n%s\n%s\n%s\n%s' % (path, redirect, max_file_size, max_file_count, expires) - signature = hmac.new(key, hmac_body, sha1).hexdigest() + signature = hmac.new(key, hmac_body, sha512).hexdigest() -The key is the value of the X-Account-Meta-Temp-URL-Key header on the -account. +The key is the value of either the account (X-Account-Meta-Temp-URL-Key, +X-Account-Meta-Temp-Url-Key-2) or the container +(X-Container-Meta-Temp-URL-Key, X-Container-Meta-Temp-Url-Key-2) TempURL keys. Be certain to use the full path, from the /v1/ onward. +Note that x_delete_at and x_delete_after are not used in signature generation +as they are both optional attributes. The command line tool ``swift-form-signature`` may be used (mostly just when testing) to compute expires and signature. 
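One caveat about the sample signature code in the updated docstring: on Python 3, ``hmac.new`` requires bytes for both the key and the message, so both need encoding before use. A hedged, runnable variant of the same computation::

    import hmac
    from hashlib import sha512
    from time import time

    path = '/v1/AUTH_account/container/object_prefix'
    redirect = ''            # leave empty if the form has no redirect field
    max_file_size = 104857600
    max_file_count = 10
    expires = int(time() + 600)
    key = 'mykey'            # an account or container Temp-URL key

    hmac_body = '%s\n%s\n%s\n%s\n%s' % (
        path, redirect, max_file_size, max_file_count, expires)
    signature = hmac.new(key.encode('utf-8'), hmac_body.encode('utf-8'),
                         sha512).hexdigest()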
@@ -102,16 +123,23 @@ __all__ = ['FormPost', 'filter_factory', 'READ_CHUNK_SIZE', 'MAX_VALUE_LENGTH'] import hmac -import re -import rfc822 -from hashlib import sha1 -from StringIO import StringIO -from time import gmtime, strftime, time -from urllib import quote, unquote +from time import time -from swift.common.utils import get_logger, streq_const_time -from swift.common.wsgi import make_pre_authed_env -from swift.common.http import HTTP_BAD_REQUEST +from urllib.parse import quote + +from swift.common.constraints import valid_api_version +from swift.common.exceptions import MimeInvalid +from swift.common.middleware.tempurl import get_tempurl_keys_from_metadata +from swift.common.digest import get_allowed_digests, \ + extract_digest_and_algorithm, DEFAULT_ALLOWED_DIGESTS +from swift.common.utils import streq_const_time, parse_content_disposition, \ + parse_mime_headers, iter_multipart_mime_documents, reiterate, \ + closing_if_possible, get_logger, InputProxy +from swift.common.registry import register_swift_info +from swift.common.wsgi import WSGIContext, make_pre_authed_env +from swift.common.swob import HTTPUnauthorized, wsgi_to_str, str_to_wsgi +from swift.common.http import is_success +from swift.proxy.controllers.base import get_account_info, get_container_info #: The size of data to read from the form at any given time. @@ -121,134 +149,16 @@ #: truncated. MAX_VALUE_LENGTH = 4096 -#: Regular expression to match form attributes. -ATTRIBUTES_RE = re.compile(r'(\w+)=(".*?"|[^";]+)(; ?|$)') - class FormInvalid(Exception): pass -def _parse_attrs(header): - """ - Given the value of a header like: - Content-Disposition: form-data; name="somefile"; filename="test.html" - - Return data like - ("form-data", {"name": "somefile", "filename": "test.html"}) - - :param header: Value of a header (the part after the ': '). - :returns: (value name, dict) of the attribute data parsed (see above). 
- """ - attributes = {} - attrs = '' - if '; ' in header: - header, attrs = header.split('; ', 1) - m = True - while m: - m = ATTRIBUTES_RE.match(attrs) - if m: - attrs = attrs[len(m.group(0)):] - attributes[m.group(1)] = m.group(2).strip('"') - return header, attributes - - -class _IterRequestsFileLikeObject(object): - - def __init__(self, wsgi_input, boundary, input_buffer): - self.no_more_data_for_this_file = False - self.no_more_files = False - self.wsgi_input = wsgi_input - self.boundary = boundary - self.input_buffer = input_buffer - - def read(self, length=None): - if not length: - length = READ_CHUNK_SIZE - if self.no_more_data_for_this_file: - return '' - - # read enough data to know whether we're going to run - # into a boundary in next [length] bytes - if len(self.input_buffer) < length + len(self.boundary) + 2: - to_read = length + len(self.boundary) + 2 - while to_read > 0: - chunk = self.wsgi_input.read(to_read) - to_read -= len(chunk) - self.input_buffer += chunk - if not chunk: - self.no_more_files = True - break - - boundary_pos = self.input_buffer.find(self.boundary) - - # boundary does not exist in the next (length) bytes - if boundary_pos == -1 or boundary_pos > length: - ret = self.input_buffer[:length] - self.input_buffer = self.input_buffer[length:] - # if it does, just return data up to the boundary - else: - ret, self.input_buffer = self.input_buffer.split(self.boundary, 1) - self.no_more_files = self.input_buffer.startswith('--') - self.no_more_data_for_this_file = True - self.input_buffer = self.input_buffer[2:] - return ret - - def readline(self): - if self.no_more_data_for_this_file: - return '' - boundary_pos = newline_pos = -1 - while newline_pos < 0 and boundary_pos < 0: - chunk = self.wsgi_input.read(READ_CHUNK_SIZE) - self.input_buffer += chunk - newline_pos = self.input_buffer.find('\r\n') - boundary_pos = self.input_buffer.find(self.boundary) - if not chunk: - self.no_more_files = True - break - # found a newline - if newline_pos >= 0 and \ - (boundary_pos < 0 or newline_pos < boundary_pos): - # Use self.read to ensure any logic there happens... - ret = '' - to_read = newline_pos + 2 - while to_read > 0: - chunk = self.read(to_read) - # Should never happen since we're reading from input_buffer, - # but just for completeness... - if not chunk: - break - to_read -= len(chunk) - ret += chunk - return ret - else: # no newlines, just return up to next boundary - return self.read(len(self.input_buffer)) - +class FormUnauthorized(Exception): + pass -def _iter_requests(wsgi_input, boundary): - """ - Given a multi-part mime encoded input file object and boundary, - yield file-like objects for each part. - :param wsgi_input: The file-like object to read from. - :param boundary: The mime boundary to separate new file-like - objects on. - :returns: A generator of file-like objects for each part. 
- """ - boundary = '--' + boundary - if wsgi_input.readline().strip() != boundary: - raise FormInvalid('invalid starting boundary') - boundary = '\r\n' + boundary - input_buffer = '' - done = False - while not done: - it = _IterRequestsFileLikeObject(wsgi_input, boundary, input_buffer) - yield it - done = it.no_more_files - input_buffer = it.input_buffer - - -class _CappedFileLikeObject(object): +class _CappedFileLikeObject(InputProxy): """ A file-like object wrapping another file-like object that raises an EOFError if the amount of data read exceeds a given @@ -260,23 +170,15 @@ class _CappedFileLikeObject(object): """ def __init__(self, fp, max_file_size): - self.fp = fp + super().__init__(fp) self.max_file_size = max_file_size - self.amount_read = 0 - - def read(self, size=None): - ret = self.fp.read(size) - self.amount_read += len(ret) - if self.amount_read > self.max_file_size: - raise EOFError('max_file_size exceeded') - return ret + self.file_size_exceeded = False - def readline(self): - ret = self.fp.readline() - self.amount_read += len(ret) - if self.amount_read > self.max_file_size: + def chunk_update(self, chunk, eof, *args, **kwargs): + if self.bytes_received > self.max_file_size: + self.file_size_exceeded = True raise EOFError('max_file_size exceeded') - return ret + return chunk class FormPost(object): @@ -285,20 +187,25 @@ class FormPost(object): See above for a full description. + The proxy logs created for any subrequests made will have swift.source set + to "FP". + :param app: The next WSGI filter or app in the paste.deploy chain. :param conf: The configuration dict for the middleware. """ - def __init__(self, app, conf): + def __init__(self, app, conf, logger=None): #: The next WSGI application/filter in the paste.deploy pipeline. self.app = app #: The filter configuration dict. self.conf = conf - #: The logger to use with this middleware. - self.logger = get_logger(conf, log_route='formpost') - #: The HTTP user agent to use with subrequests. - self.agent = '%(orig)s FormPost' + self.logger = logger or get_logger(conf, log_route='formpost') + # Defaulting to SUPPORTED_DIGESTS just so we don't completely + # deprecate sha1 yet. We'll change this to DEFAULT_ALLOWED_DIGESTS + # later. 
+ self.allowed_digests = conf.get( + 'allowed_digests', DEFAULT_ALLOWED_DIGESTS.split()) def __call__(self, env, start_response): """ @@ -311,22 +218,34 @@ def __call__(self, env, start_response): if env['REQUEST_METHOD'] == 'POST': try: content_type, attrs = \ - _parse_attrs(env.get('CONTENT_TYPE') or '') + parse_content_disposition(env.get('CONTENT_TYPE') or '') if content_type == 'multipart/form-data' and \ 'boundary' in attrs: + http_user_agent = "%s FormPost" % ( + env.get('HTTP_USER_AGENT', '')) + env['HTTP_USER_AGENT'] = http_user_agent.strip() status, headers, body = self._translate_form( env, attrs['boundary']) - self._log_request(env, int(status.split(' ', 1)[0])) start_response(status, headers) - return body - except (FormInvalid, EOFError), err: - self._log_request(env, HTTP_BAD_REQUEST) - body = 'FormPost: %s' % err + return [body] + except MimeInvalid: + body = b'FormPost: invalid starting boundary' + start_response( + '400 Bad Request', + (('Content-Type', 'text/plain'), + ('Content-Length', str(len(body))))) + return [body] + except (FormInvalid, EOFError) as err: + body = ('FormPost: %s' % err).encode('utf-8') start_response( '400 Bad Request', (('Content-Type', 'text/plain'), ('Content-Length', str(len(body))))) return [body] + except FormUnauthorized as err: + message = 'FormPost: %s' % str(err).title() + return HTTPUnauthorized(body=message)( + env, start_response) return self.app(env, start_response) def _translate_form(self, env, boundary): @@ -338,14 +257,19 @@ def _translate_form(self, env, boundary): :param boundary: The MIME type boundary to look for. :returns: status_line, headers_list, body """ - key = self._get_key(env) + keys = self._get_keys(env) + boundary = boundary.encode('utf-8') status = message = '' attributes = {} + file_attributes = {} + subheaders = [] + resp_body = None file_count = 0 - for fp in _iter_requests(env['wsgi.input'], boundary): - hdrs = rfc822.Message(fp, 0) - disp, attrs = \ - _parse_attrs(hdrs.getheader('Content-Disposition', '')) + for fp in iter_multipart_mime_documents( + env['wsgi.input'], boundary, read_chunk_size=READ_CHUNK_SIZE): + hdrs = parse_mime_headers(fp) + disp, attrs = parse_content_disposition( + hdrs.get('Content-Disposition', '')) if disp == 'form-data' and attrs.get('filename'): file_count += 1 try: @@ -355,16 +279,22 @@ def _translate_form(self, env, boundary): break except ValueError: raise FormInvalid('max_file_count not an integer') - attributes['filename'] = attrs['filename'] or 'filename' + file_attributes = attributes.copy() + file_attributes['filename'] = attrs['filename'] or 'filename' if 'content-type' not in attributes and 'content-type' in hdrs: - attributes['content-type'] = \ + file_attributes['content-type'] = \ hdrs['Content-Type'] or 'application/octet-stream' - status, message = self._perform_subrequest(env, attributes, fp, - key) - if status[:1] != '2': + if 'content-encoding' not in attributes and \ + 'content-encoding' in hdrs: + file_attributes['content-encoding'] = \ + hdrs['Content-Encoding'] + status, subheaders, resp_body = \ + self._perform_subrequest(env, file_attributes, fp, keys) + status_code = int(status.split(' ', 1)[0]) + if not is_success(status_code): break else: - data = '' + data = b'' mxln = MAX_VALUE_LENGTH while mxln: chunk = fp.read(mxln) @@ -374,29 +304,42 @@ def _translate_form(self, env, boundary): data += chunk while fp.read(READ_CHUNK_SIZE): pass + data = data.decode('utf-8') if 'name' in attrs: attributes[attrs['name'].lower()] = data.rstrip('\r\n--') if not status: 
status = '400 Bad Request' message = 'no files to process' - if not attributes.get('redirect'): + + status_code = int(status.split(' ', 1)[0]) + headers = [(k, v) for k, v in subheaders + if k.lower().startswith('access-control')] + + redirect = attributes.get('redirect') + if not redirect: body = status if message: body = status + '\r\nFormPost: ' + message.title() - headers = [('Content-Type', 'text/plain'), - ('Content-Length', len(body))] + body = body.encode('utf-8') + if not is_success(status_code) and resp_body: + body = resp_body + headers.extend([('Content-Type', 'text/plain'), + ('Content-Length', len(body))]) return status, headers, body - status = status.split(' ', 1)[0] - body = '
<html><body><p><a href="%s?status=%s&message=%s">Click to ' \ - 'continue...</a></p></body></html>
' % \ - (attributes['redirect'], quote(status), quote(message)) - headers = [ - ('Location', '%s?status=%s&message=%s' % ( - attributes['redirect'], quote(status), quote(message))), - ('Content-Length', str(len(body)))] + if '?' in redirect: + redirect += '&' + else: + redirect += '?' + redirect += 'status=%s&message=%s' % (quote(str(status_code)), + quote(message)) + body = '
<html><body><p><a href="%s">' \ + 'Click to continue...</a></p></body></html>
' % redirect + body = body.encode('utf-8') + headers.extend( + [('Location', redirect), ('Content-Length', str(len(body)))]) return '303 See Other', headers, body - def _perform_subrequest(self, orig_env, attributes, fp, key): + def _perform_subrequest(self, orig_env, attributes, fp, keys): """ Performs the subrequest and returns the response. @@ -404,135 +347,125 @@ def _perform_subrequest(self, orig_env, attributes, fp, key): to form a new env for the subrequest. :param attributes: dict of the attributes of the form so far. :param fp: The file-like object containing the request body. - :param key: The account key to validate the signature with. - :returns: (status_line, message) + :param keys: The account keys to validate the signature with. + :returns: (status_line, headers_list) """ - if not key: - return '401 Unauthorized', 'invalid signature' + if not keys: + raise FormUnauthorized('invalid signature') try: max_file_size = int(attributes.get('max_file_size') or 0) except ValueError: raise FormInvalid('max_file_size not an integer') - subenv = make_pre_authed_env(orig_env, 'PUT', agent=self.agent) + subenv = make_pre_authed_env(orig_env, 'PUT', agent=None, + swift_source='FP') + if 'QUERY_STRING' in subenv: + del subenv['QUERY_STRING'] subenv['HTTP_TRANSFER_ENCODING'] = 'chunked' subenv['wsgi.input'] = _CappedFileLikeObject(fp, max_file_size) - if subenv['PATH_INFO'][-1] != '/' and \ + if not subenv['PATH_INFO'].endswith('/') and \ subenv['PATH_INFO'].count('/') < 4: subenv['PATH_INFO'] += '/' - subenv['PATH_INFO'] += attributes['filename'] or 'filename' + subenv['PATH_INFO'] += str_to_wsgi( + attributes['filename'] or 'filename') + if 'x_delete_at' in attributes: + try: + subenv['HTTP_X_DELETE_AT'] = int(attributes['x_delete_at']) + except ValueError: + raise FormInvalid('x_delete_at not an integer: ' + 'Unix timestamp required.') + if 'x_delete_after' in attributes: + try: + subenv['HTTP_X_DELETE_AFTER'] = int( + attributes['x_delete_after']) + except ValueError: + raise FormInvalid('x_delete_after not an integer: ' + 'Number of seconds required.') if 'content-type' in attributes: subenv['CONTENT_TYPE'] = \ attributes['content-type'] or 'application/octet-stream' - elif 'CONTENT_TYPE' in subenv: - del subenv['CONTENT_TYPE'] + if 'content-encoding' in attributes: + subenv['HTTP_CONTENT_ENCODING'] = attributes['content-encoding'] try: if int(attributes.get('expires') or 0) < time(): - return '401 Unauthorized', 'form expired' + raise FormUnauthorized('form expired') except ValueError: raise FormInvalid('expired not an integer') hmac_body = '%s\n%s\n%s\n%s\n%s' % ( - orig_env['PATH_INFO'], + wsgi_to_str(orig_env['PATH_INFO']), attributes.get('redirect') or '', attributes.get('max_file_size') or '0', attributes.get('max_file_count') or '0', attributes.get('expires') or '0') - sig = hmac.new(key, hmac_body, sha1).hexdigest() - if not streq_const_time(sig, (attributes.get('signature') or - 'invalid')): - return '401 Unauthorized', 'invalid signature' - substatus = [None] - - def _start_response(status, headers, exc_info=None): - substatus[0] = status + hmac_body = hmac_body.encode('utf-8') - i = iter(self.app(subenv, _start_response)) + has_valid_sig = False + signature = attributes.get('signature', '') try: - i.next() - except StopIteration: - pass - return substatus[0], '' - - def _get_key(self, env): + hash_name, signature = extract_digest_and_algorithm(signature) + except ValueError: + raise FormUnauthorized('invalid signature') + if hash_name not in self.allowed_digests: + raise 
FormUnauthorized('invalid signature') + + for key in keys: + # Encode key like in swift.common.utls.get_hmac. + if not isinstance(key, bytes): + key = key.encode('utf8') + sig = hmac.new(key, hmac_body, hash_name).hexdigest() + if streq_const_time(sig, signature): + has_valid_sig = True + if not has_valid_sig: + raise FormUnauthorized('invalid signature') + self.logger.increment('formpost.digests.%s' % hash_name) + wsgi_ctx = WSGIContext(self.app) + wsgi_input = subenv['wsgi.input'] + resp = wsgi_ctx._app_call(subenv) + if wsgi_input.file_size_exceeded: + raise EOFError("max_file_size exceeded") + with closing_if_possible(reiterate(resp)): + body = b''.join(resp) + return wsgi_ctx._response_status, wsgi_ctx._response_headers, body + + def _get_keys(self, env): """ - Returns the X-Account-Meta-Temp-URL-Key header value for the - account, or None if none is set. + Returns the X-[Account|Container]-Meta-Temp-URL-Key[-2] header values + for the account or container, or an empty list if none are set. + + Returns 0-4 elements depending on how many keys are set in the + account's or container's metadata. + + Also validate that the request + path indicates a valid container; if not, no keys will be returned. :param env: The WSGI environment for the request. - :returns: X-Account-Meta-Temp-URL-Key str value, or None. + :returns: list of tempurl keys """ parts = env['PATH_INFO'].split('/', 4) - if len(parts) < 4 or parts[0] or parts[1] != 'v1' or not parts[2] or \ - not parts[3]: - return None - account = parts[2] - key = None - memcache = env.get('swift.cache') - if memcache: - key = memcache.get('temp-url-key/%s' % account) - if not key: - newenv = make_pre_authed_env(env, 'HEAD', '/v1/' + account, - self.agent) - newenv['CONTENT_LENGTH'] = '0' - newenv['wsgi.input'] = StringIO('') - key = [None] - - def _start_response(status, response_headers, exc_info=None): - for h, v in response_headers: - if h.lower() == 'x-account-meta-temp-url-key': - key[0] = v - - i = iter(self.app(newenv, _start_response)) - try: - i.next() - except StopIteration: - pass - key = key[0] - if key and memcache: - memcache.set('temp-url-key/%s' % account, key, timeout=60) - return key - - def _log_request(self, env, response_status_int): - """ - Used when a request might not be logged by the underlying - WSGI application, but we'd still like to record what - happened. An early 401 Unauthorized is a good example of - this. + if len(parts) < 4 or parts[0] or not valid_api_version(parts[1]) \ + or not parts[2] or not parts[3]: + return [] - :param env: The WSGI environment for the request. - :param response_status_int: The HTTP status we'll be replying - to the request with. - """ - the_request = quote(unquote(env.get('PATH_INFO') or '/')) - if env.get('QUERY_STRING'): - the_request = the_request + '?' 
+ env['QUERY_STRING'] - client = env.get('HTTP_X_CLUSTER_CLIENT_IP') - if not client and 'HTTP_X_FORWARDED_FOR' in env: - # remote host for other lbs - client = env['HTTP_X_FORWARDED_FOR'].split(',')[0].strip() - if not client: - client = env.get('REMOTE_ADDR') - self.logger.info(' '.join(quote(str(x)) for x in ( - client or '-', - env.get('REMOTE_ADDR') or '-', - strftime('%d/%b/%Y/%H/%M/%S', gmtime()), - env.get('REQUEST_METHOD') or 'GET', - the_request, - env.get('SERVER_PROTOCOL') or '1.0', - response_status_int, - env.get('HTTP_REFERER') or '-', - (env.get('HTTP_USER_AGENT') or '-') + ' FormPOST', - env.get('HTTP_X_AUTH_TOKEN') or '-', - '-', - '-', - '-', - env.get('swift.trans_id') or '-', - '-', - '-', - ))) + account_info = get_account_info(env, self.app, swift_source='FP') + account_keys = get_tempurl_keys_from_metadata(account_info['meta']) + + container_info = get_container_info(env, self.app, swift_source='FP') + container_keys = get_tempurl_keys_from_metadata( + container_info.get('meta', [])) + + return account_keys + container_keys def filter_factory(global_conf, **local_conf): - """ Returns the WSGI filter for use with paste.deploy. """ + """Returns the WSGI filter for use with paste.deploy.""" conf = global_conf.copy() conf.update(local_conf) + + logger = get_logger(conf, log_route='formpost') + allowed_digests, deprecated_digests = get_allowed_digests( + conf.get('allowed_digests', '').split(), logger) + info = {'allowed_digests': sorted(allowed_digests)} + if deprecated_digests: + info['deprecated_digests'] = sorted(deprecated_digests) + register_swift_info('formpost', **info) + conf.update(info) return lambda app: FormPost(app, conf) diff --git a/swift/common/middleware/gatekeeper.py b/swift/common/middleware/gatekeeper.py new file mode 100644 index 0000000000..dfb5ef04b0 --- /dev/null +++ b/swift/common/middleware/gatekeeper.py @@ -0,0 +1,138 @@ +# Copyright (c) 2010-2012 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. +""" +The ``gatekeeper`` middleware imposes restrictions on the headers that +may be included with requests and responses. Request headers are filtered +to remove headers that should never be generated by a client. Similarly, +response headers are filtered to remove private headers that should +never be passed to a client. + +The ``gatekeeper`` middleware must always be present in the proxy server +wsgi pipeline. It should be configured close to the start of the pipeline +specified in ``/etc/swift/proxy-server.conf``, immediately after catch_errors +and before any other middleware. It is essential that it is configured ahead +of all middlewares using system metadata in order that they function +correctly. + +If ``gatekeeper`` middleware is not configured in the pipeline then it will be +automatically inserted close to the start of the pipeline by the proxy server. 
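For illustration only (not part of this patch), a proxy pipeline that honours the placement described above might start like this; everything after gatekeeper is just a typical selection of other filters:

    [pipeline:main]
    pipeline = catch_errors gatekeeper healthcheck proxy-logging cache tempauth proxy-server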
+""" + + +from swift.common.swob import Request +from swift.common.utils import get_logger, config_true_value +from swift.common.request_helpers import ( + remove_items, get_sys_meta_prefix, OBJECT_TRANSIENT_SYSMETA_PREFIX +) +from urllib.parse import urlsplit +import re + +#: A list of python regular expressions that will be used to +#: match against inbound request headers. Matching headers will +#: be removed from the request. +# Exclude headers starting with a sysmeta prefix. +# Exclude headers starting with object transient system metadata prefix. +# Exclude headers starting with an internal backend header prefix. +# If adding to this list, note that these are regex patterns, +# so use a trailing $ to constrain to an exact header match +# rather than prefix match. +inbound_exclusions = [get_sys_meta_prefix('account'), + get_sys_meta_prefix('container'), + get_sys_meta_prefix('object'), + OBJECT_TRANSIENT_SYSMETA_PREFIX, + 'x-backend'] + + +#: A list of python regular expressions that will be used to +#: match against outbound response headers. Matching headers will +#: be removed from the response. +outbound_exclusions = inbound_exclusions + + +def make_exclusion_test(exclusions): + expr = '|'.join(exclusions) + test = re.compile(expr, re.IGNORECASE) + return test.match + + +class GatekeeperMiddleware(object): + def __init__(self, app, conf): + self.app = app + self.logger = get_logger(conf, log_route='gatekeeper') + self.inbound_condition = make_exclusion_test(inbound_exclusions) + self.outbound_condition = make_exclusion_test(outbound_exclusions) + self.shunt_x_timestamp = config_true_value( + conf.get('shunt_inbound_x_timestamp', 'true')) + self.allow_reserved_names_header = config_true_value( + conf.get('allow_reserved_names_header', 'false')) + + def __call__(self, env, start_response): + req = Request(env) + removed = remove_items(req.headers, self.inbound_condition) + if removed: + self.logger.debug('removed request headers: %s' % removed) + + if 'X-Timestamp' in req.headers and self.shunt_x_timestamp: + ts = req.headers.pop('X-Timestamp') + req.headers['X-Backend-Inbound-X-Timestamp'] = ts + # log in a similar format as the removed headers + self.logger.debug('shunted request headers: %s' % + [('X-Timestamp', ts)]) + + if 'X-Allow-Reserved-Names' in req.headers \ + and self.allow_reserved_names_header: + req.headers['X-Backend-Allow-Reserved-Names'] = \ + req.headers.pop('X-Allow-Reserved-Names') + + def gatekeeper_response(status, response_headers, exc_info=None): + def fixed_response_headers(): + def relative_path(value): + parsed = urlsplit(value) + new_path = parsed.path + if parsed.query: + new_path += ('?%s' % parsed.query) + if parsed.fragment: + new_path += ('#%s' % parsed.fragment) + return new_path + + if not env.get('swift.leave_relative_location'): + return response_headers + else: + return [ + (k, v) if k.lower() != 'location' else + (k, relative_path(v)) for (k, v) in response_headers + ] + + response_headers = fixed_response_headers() + removed = [(header, value) for header, value in response_headers + if self.outbound_condition(header)] + + if removed: + self.logger.debug('removed response headers: %s' % removed) + new_headers = [ + (header, value) for header, value in response_headers + if not self.outbound_condition(header)] + return start_response(status, new_headers, exc_info) + return start_response(status, response_headers, exc_info) + return self.app(env, gatekeeper_response) + + +def filter_factory(global_conf, **local_conf): + conf = global_conf.copy() 
+ conf.update(local_conf) + + def gatekeeper_filter(app): + return GatekeeperMiddleware(app, conf) + return gatekeeper_filter diff --git a/swift/common/middleware/healthcheck.py b/swift/common/middleware/healthcheck.py index 75deda250a..f9f6b24ea9 100644 --- a/swift/common/middleware/healthcheck.py +++ b/swift/common/middleware/healthcheck.py @@ -1,4 +1,4 @@ -# Copyright (c) 2010-2012 OpenStack, LLC. +# Copyright (c) 2010-2012 OpenStack Foundation # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. @@ -31,29 +31,24 @@ class HealthCheckMiddleware(object): def __init__(self, app, conf): self.app = app - self.conf = conf self.disable_path = conf.get('disable_path', '') def GET(self, req): """Returns a 200 response with "OK" in the body.""" - return Response(request=req, body="OK", content_type="text/plain") + return Response(request=req, body=b"OK", content_type="text/plain") def DISABLED(self, req): """Returns a 503 response with "DISABLED BY FILE" in the body.""" - return Response(request=req, status=503, body="DISABLED BY FILE", + return Response(request=req, status=503, body=b"DISABLED BY FILE", content_type="text/plain") def __call__(self, env, start_response): req = Request(env) - try: - if req.path == '/healthcheck': - handler = self.GET - if self.disable_path and os.path.exists(self.disable_path): - handler = self.DISABLED - return handler(req)(env, start_response) - except UnicodeError: - # definitely, this is not /healthcheck - pass + if req.path == '/healthcheck': + handler = self.GET + if self.disable_path and os.path.exists(self.disable_path): + handler = self.DISABLED + return handler(req)(env, start_response) return self.app(env, start_response) diff --git a/swift/common/middleware/keystoneauth.py b/swift/common/middleware/keystoneauth.py index b7cdd347cb..ff25b9f347 100644 --- a/swift/common/middleware/keystoneauth.py +++ b/swift/common/middleware/keystoneauth.py @@ -1,6 +1,4 @@ -# vim: tabstop=4 shiftwidth=4 softtabstop=4 - -# Copyright 2012 OpenStack LLC +# Copyright 2012 OpenStack Foundation # # Licensed under the Apache License, Version 2.0 (the "License"); you may # not use this file except in compliance with the License. You may obtain @@ -15,39 +13,51 @@ # under the License. from swift.common import utils as swift_utils +from swift.common.http import is_success from swift.common.middleware import acl as swift_acl +from swift.common.request_helpers import get_sys_meta_prefix from swift.common.swob import HTTPNotFound, HTTPForbidden, HTTPUnauthorized +from swift.common.utils import config_read_reseller_options, list_from_csv +from swift.proxy.controllers.base import get_account_info +import functools + +PROJECT_DOMAIN_ID_HEADER = 'x-account-project-domain-id' +PROJECT_DOMAIN_ID_SYSMETA_HEADER = \ + get_sys_meta_prefix('account') + 'project-domain-id' +# a string that is unique w.r.t valid ids +UNKNOWN_ID = '_unknown' class KeystoneAuth(object): """Swift middleware to Keystone authorization system. - In Swift's proxy-server.conf add this middleware to your pipeline:: - - [pipeline:main] - pipeline = catch_errors cache authtoken keystoneauth proxy-server - - Make sure you have the authtoken middleware before the - keystoneauth middleware. + In Swift's proxy-server.conf add this keystoneauth middleware and the + authtoken middleware to your pipeline. Make sure you have the authtoken + middleware before the keystoneauth middleware. 
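For example, a minimal pipeline satisfying that ordering (essentially the snippet this patch drops from the docstring in favour of pointing at the sample config) is:

    [pipeline:main]
    pipeline = catch_errors cache authtoken keystoneauth proxy-server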
The authtoken middleware will take care of validating the user and keystoneauth will authorize access. - The authtoken middleware is shipped directly with keystone it - does not have any other dependences than itself so you can either + The sample proxy-server.conf shows a sample pipeline that uses keystone. + + :download:`proxy-server.conf-sample ` + + The authtoken middleware is shipped with keystonemiddleware - it + does not have any other dependencies than itself so you can either install it by copying the file directly in your python path or by - installing keystone. + installing keystonemiddleware. If support is required for unvalidated users (as with anonymous - access) or for tempurl/formpost middleware, authtoken will need - to be configured with delay_auth_decision set to 1. See the - Keystone documentation for more detail on how to configure the + access) or for formpost/staticweb/tempurl middleware, authtoken will + need to be configured with ``delay_auth_decision`` set to true. See + the Keystone documentation for more detail on how to configure the authtoken middleware. In proxy-server.conf you will need to have the setting account auto creation to true:: - [app:proxy-server] account_autocreate = true + [app:proxy-server] + account_autocreate = true And add a swift authorization filter section, such as:: @@ -55,28 +65,107 @@ class KeystoneAuth(object): use = egg:swift#keystoneauth operator_roles = admin, swiftoperator - This maps tenants to account in Swift. - - The user whose able to give ACL / create Containers permissions - will be the one that are inside the operator_roles + The user who is able to give ACL / create Containers permissions + will be the user with a role listed in the ``operator_roles`` setting which by default includes the admin and the swiftoperator roles. - The option is_admin if set to true will allow the - username that has the same name as the account name to be the owner. - - Example: If we have the account called hellocorp with a user - hellocorp that user will be admin on that account and can give ACL - to all other users for hellocorp. + The keystoneauth middleware maps a Keystone project/tenant to an account + in Swift by adding a prefix (``AUTH_`` by default) to the tenant/project + id.. For example, if the project id is ``1234``, the path is + ``/v1/AUTH_1234``. If you need to have a different reseller_prefix to be able to mix different auth servers you can configure the option - reseller_prefix in your keystoneauth entry like this : + ``reseller_prefix`` in your keystoneauth entry like this:: + + reseller_prefix = NEWAUTH + + Don't forget to also update the Keystone service endpoint configuration to + use NEWAUTH in the path. + + It is possible to have several accounts associated with the same project. + This is done by listing several prefixes as shown in the following + example:: - reseller_prefix = NEWAUTH_ + reseller_prefix = AUTH, SERVICE - Make sure you have a underscore at the end of your new - reseller_prefix option. + This means that for project id '1234', the paths '/v1/AUTH_1234' and + '/v1/SERVICE_1234' are associated with the project and are authorized + using roles that a user has with that project. The core use of this feature + is that it is possible to provide different rules for each account + prefix. 
The following parameters may be prefixed with the appropriate + prefix:: + + operator_roles + service_roles + + For backward compatibility, if either of these parameters is specified + without a prefix then it applies to all reseller_prefixes. Here is an + example, using two prefixes:: + + reseller_prefix = AUTH, SERVICE + # The next three lines have identical effects (since the first applies + # to both prefixes). + operator_roles = admin, swiftoperator + AUTH_operator_roles = admin, swiftoperator + SERVICE_operator_roles = admin, swiftoperator + # The next line only applies to accounts with the SERVICE prefix + SERVICE_operator_roles = admin, some_other_role + + X-Service-Token tokens are supported by the inclusion of the service_roles + configuration option. When present, this option requires that the + X-Service-Token header supply a token from a user who has a role listed + in service_roles. Here is an example configuration:: + + reseller_prefix = AUTH, SERVICE + AUTH_operator_roles = admin, swiftoperator + SERVICE_operator_roles = admin, swiftoperator + SERVICE_service_roles = service + + The keystoneauth middleware supports cross-tenant access control using the + syntax ``:`` to specify a grantee in container Access Control + Lists (ACLs). For a request to be granted by an ACL, the grantee + ```` must match the UUID of the tenant to which the request + X-Auth-Token is scoped and the grantee ```` must match the UUID of + the user authenticated by that token. + + Note that names must no longer be used in cross-tenant ACLs because with + the introduction of domains in keystone names are no longer globally + unique. + + For backwards compatibility, ACLs using names will be granted by + keystoneauth when it can be established that the grantee tenant, + the grantee user and the tenant being accessed are either not yet in a + domain (e.g. the X-Auth-Token has been obtained via the keystone v2 + API) or are all in the default domain to which legacy accounts would + have been migrated. The default domain is identified by its UUID, + which by default has the value ``default``. This can be changed by + setting the ``default_domain_id`` option in the keystoneauth + configuration:: + + default_domain_id = default + + The backwards compatible behavior can be disabled by setting the config + option ``allow_names_in_acls`` to false:: + + allow_names_in_acls = false + + To enable this backwards compatibility, keystoneauth will attempt to + determine the domain id of a tenant when any new account is created, + and persist this as account metadata. If an account is created for a tenant + using a token with reselleradmin role that is not scoped on that tenant, + keystoneauth is unable to determine the domain id of the tenant; + keystoneauth will assume that the tenant may not be in the default domain + and therefore not match names in ACLs for that account. + + By default, middleware higher in the WSGI pipeline may override auth + processing, useful for middleware such as tempurl and formpost. 
If you know + you're not going to use such middleware and you want a bit of extra + security you can disable this behaviour by setting the ``allow_overrides`` + option to ``false``:: + + allow_overrides = false :param app: The next WSGI app in the pipeline :param conf: The dict of configuration values @@ -85,149 +174,360 @@ def __init__(self, app, conf): self.app = app self.conf = conf self.logger = swift_utils.get_logger(conf, log_route='keystoneauth') - self.reseller_prefix = conf.get('reseller_prefix', 'AUTH_').strip() - self.operator_roles = conf.get('operator_roles', - 'admin, swiftoperator') + self.reseller_prefixes, self.account_rules = \ + config_read_reseller_options(conf, + dict(operator_roles=['admin', + 'swiftoperator'], + service_roles=[], + project_reader_roles=[])) self.reseller_admin_role = conf.get('reseller_admin_role', - 'ResellerAdmin') + 'ResellerAdmin').lower() + self.system_reader_roles = {role.lower() for role in list_from_csv( + conf.get('system_reader_roles', ''))} + config_is_admin = conf.get('is_admin', "false").lower() - self.is_admin = swift_utils.config_true_value(config_is_admin) + if swift_utils.config_true_value(config_is_admin): + self.logger.warning("The 'is_admin' option for keystoneauth is no " + "longer supported. Remove the 'is_admin' " + "option from your keystoneauth config") + config_overrides = conf.get('allow_overrides', 't').lower() self.allow_overrides = swift_utils.config_true_value(config_overrides) + self.default_domain_id = conf.get('default_domain_id', 'default') + self.allow_names_in_acls = swift_utils.config_true_value( + conf.get('allow_names_in_acls', 'true')) def __call__(self, environ, start_response): - identity = self._keystone_identity(environ) + env_identity = self._keystone_identity(environ) # Check if one of the middleware like tempurl or formpost have # set the swift.authorize_override environ and want to control the # authentication if (self.allow_overrides and environ.get('swift.authorize_override', False)): - msg = 'Authorizing from an overriding middleware (i.e: tempurl)' + msg = 'Authorizing from an overriding middleware' self.logger.debug(msg) return self.app(environ, start_response) - if identity: - self.logger.debug('Using identity: %r' % (identity)) - environ['keystone.identity'] = identity - environ['REMOTE_USER'] = identity.get('tenant') - environ['swift.authorize'] = self.authorize + if env_identity: + self.logger.debug('Using identity: %r', env_identity) + environ['REMOTE_USER'] = env_identity.get('tenant') + environ['keystone.identity'] = env_identity + environ['swift.authorize'] = functools.partial( + self.authorize, env_identity) + user_roles = (r.lower() for r in env_identity.get('roles', [])) + if self.reseller_admin_role in user_roles: + environ['reseller_request'] = True + # Set access_user_id for consistent logging across auth middlewares + access_logging = environ.setdefault('swift.access_logging', {}) + user_id, user_name = env_identity.get('user', (None, None)) + access_logging['user_id'] = user_id or user_name else: self.logger.debug('Authorizing as anonymous') environ['swift.authorize'] = self.authorize_anonymous environ['swift.clean_acl'] = swift_acl.clean_acl - return self.app(environ, start_response) + def keystone_start_response(status, response_headers, exc_info=None): + project_domain_id = None + for key, val in response_headers: + if key.lower() == PROJECT_DOMAIN_ID_SYSMETA_HEADER: + project_domain_id = val + break + if project_domain_id: + response_headers.append((PROJECT_DOMAIN_ID_HEADER, + 
project_domain_id)) + return start_response(status, response_headers, exc_info) + + return self.app(environ, keystone_start_response) def _keystone_identity(self, environ): """Extract the identity from the Keystone auth component.""" - if environ.get('HTTP_X_IDENTITY_STATUS') != 'Confirmed': + if (environ.get('HTTP_X_IDENTITY_STATUS') != 'Confirmed' + or environ.get( + 'HTTP_X_SERVICE_IDENTITY_STATUS') not in (None, 'Confirmed')): return - roles = [] - if 'HTTP_X_ROLES' in environ: - roles = environ['HTTP_X_ROLES'].split(',') - identity = {'user': environ.get('HTTP_X_USER_NAME'), - 'tenant': (environ.get('HTTP_X_TENANT_ID'), - environ.get('HTTP_X_TENANT_NAME')), - 'roles': roles} + roles = list_from_csv(environ.get('HTTP_X_ROLES', '')) + service_roles = list_from_csv(environ.get('HTTP_X_SERVICE_ROLES', '')) + identity = {'user': (environ.get('HTTP_X_USER_ID'), + environ.get('HTTP_X_USER_NAME')), + 'tenant': (environ.get('HTTP_X_PROJECT_ID', + environ.get('HTTP_X_TENANT_ID')), + environ.get('HTTP_X_PROJECT_NAME', + environ.get('HTTP_X_TENANT_NAME'))), + 'roles': roles, + 'service_roles': service_roles} + token_info = environ.get('keystone.token_info', {}) + auth_version = 0 + user_domain = project_domain = (None, None) + if 'access' in token_info: + # ignore any domain id headers that authtoken may have set + auth_version = 2 + elif 'token' in token_info: + auth_version = 3 + user_domain = (environ.get('HTTP_X_USER_DOMAIN_ID'), + environ.get('HTTP_X_USER_DOMAIN_NAME')) + project_domain = (environ.get('HTTP_X_PROJECT_DOMAIN_ID'), + environ.get('HTTP_X_PROJECT_DOMAIN_NAME')) + identity['user_domain'] = user_domain + identity['project_domain'] = project_domain + identity['auth_version'] = auth_version return identity - def _get_account_for_tenant(self, tenant_id): - return '%s%s' % (self.reseller_prefix, tenant_id) + def _get_account_name(self, prefix, tenant_id): + return '%s%s' % (prefix, tenant_id) - def _reseller_check(self, account, tenant_id): - """Check reseller prefix.""" - return account == self._get_account_for_tenant(tenant_id) + def _account_matches_tenant(self, account, tenant_id): + """Check if account belongs to a project/tenant""" + for prefix in self.reseller_prefixes: + if self._get_account_name(prefix, tenant_id) == account: + return True + return False + + def _get_account_prefix(self, account): + """Get the prefix of an account""" + # Empty prefix matches everything, so try to match others first + for prefix in [pre for pre in self.reseller_prefixes if pre != '']: + if account.startswith(prefix): + return prefix + if '' in self.reseller_prefixes: + return '' + return None + + def _get_project_domain_id(self, environ): + info = get_account_info(environ, self.app, 'KS') + domain_id = info.get('sysmeta', {}).get('project-domain-id') + exists = (is_success(info.get('status', 0)) + and info.get('account_really_exists', True)) + return exists, domain_id + + def _set_project_domain_id(self, req, path_parts, env_identity): + ''' + Try to determine the project domain id and save it as + account metadata. Do this for a PUT or POST to the + account, and also for a container PUT in case that + causes the account to be auto-created. 
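Concretely (value invented), once the domain id has been determined for a new account it is persisted as account sysmeta of the form below; the header name follows from get_sys_meta_prefix('account') plus 'project-domain-id':

    X-Account-Sysmeta-Project-Domain-Id: default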
+ ''' + if PROJECT_DOMAIN_ID_SYSMETA_HEADER in req.headers: + return + + version, account, container, obj = path_parts + method = req.method + if (obj or (container and method != 'PUT') + or method not in ['PUT', 'POST']): + return - def _authorize_cross_tenant(self, user, tenant_id, tenant_name, roles): - """ Check cross-tenant ACLs + tenant_id, tenant_name = env_identity['tenant'] + exists, sysmeta_id = self._get_project_domain_id(req.environ) + req_has_id, req_id, new_id = False, None, None + if self._account_matches_tenant(account, tenant_id): + # domain id can be inferred from request (may be None) + req_has_id = True + req_id = env_identity['project_domain'][0] + if not exists: + # new account so set a domain id + new_id = req_id if req_has_id else UNKNOWN_ID + elif sysmeta_id is None and req_id == self.default_domain_id: + # legacy account, update if default domain id in req + new_id = req_id + elif sysmeta_id == UNKNOWN_ID and req_has_id: + # unknown domain, update if req confirms domain + new_id = req_id or '' + elif req_has_id and sysmeta_id != req_id: + self.logger.warning("Inconsistent project domain id: " + + "%s in token vs %s in account metadata." + % (req_id, sysmeta_id)) + + if new_id is not None: + req.headers[PROJECT_DOMAIN_ID_SYSMETA_HEADER] = new_id + + def _is_name_allowed_in_acl(self, req, path_parts, identity): + if not self.allow_names_in_acls: + return False + user_domain_id = identity['user_domain'][0] + if user_domain_id and user_domain_id != self.default_domain_id: + return False - Match tenant_id:user, tenant_name:user, and *:user. + proj_domain_id = identity['project_domain'][0] + if proj_domain_id and proj_domain_id != self.default_domain_id: + return False - :param user: The user name from the identity token. + # request user and scoped project are both in default domain + tenant_id, tenant_name = identity['tenant'] + version, account, container, obj = path_parts + if self._account_matches_tenant(account, tenant_id): + # account == scoped project, so account is also in default domain + allow = True + else: + # retrieve account project domain id from account sysmeta + exists, acc_domain_id = self._get_project_domain_id(req.environ) + allow = exists and acc_domain_id in [self.default_domain_id, None] + if allow: + self.logger.debug("Names allowed in acls.") + return allow + + def _authorize_cross_tenant(self, user_id, user_name, + tenant_id, tenant_name, roles, + allow_names=True): + """Check cross-tenant ACLs. + + Match tenant:user, tenant and user could be its id, name or '*' + + :param user_id: The user id from the identity token. + :param user_name: The user name from the identity token. :param tenant_id: The tenant ID from the identity token. :param tenant_name: The tenant name from the identity token. :param roles: The given container ACL. + :param allow_names: If True then attempt to match tenant and user names + as well as id's. - :returns: True if tenant_id:user, tenant_name:user, or *:user matches - the given ACL. False otherwise. + :returns: matched string if tenant(name/id/*):user(name/id/*) matches + the given ACL. + None otherwise. 
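To make the matching rule concrete, here is a standalone sketch that mirrors the logic (the ids, names and ACL entries are invented; the real check is the _authorize_cross_tenant method itself):

    def cross_tenant_match(user_id, user_name, tenant_id, tenant_name, acl,
                           allow_names=True):
        # Build the candidate grantee strings and return the first one
        # present in the ACL, or None.
        tenants = [tenant_id, '*'] + ([tenant_name] if allow_names else [])
        users = [user_id, '*'] + ([user_name] if allow_names else [])
        for tenant in tenants:
            for user in users:
                candidate = '%s:%s' % (tenant, user)
                if candidate in acl:
                    return candidate
        return None

    acl = ['a1b2c3:u4v5w6', '*:roving-auditor-id']
    assert cross_tenant_match('u4v5w6', 'bob', 'a1b2c3', 'acme', acl) == 'a1b2c3:u4v5w6'
    assert cross_tenant_match('roving-auditor-id', 'anna', 'zzz9', 'other', acl) == '*:roving-auditor-id'
    assert cross_tenant_match('nobody', 'carl', 'zzz9', 'other', acl) is None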
""" - wildcard_tenant_match = '*:%s' % (user) - tenant_id_user_match = '%s:%s' % (tenant_id, user) - tenant_name_user_match = '%s:%s' % (tenant_name, user) - - return (wildcard_tenant_match in roles - or tenant_id_user_match in roles - or tenant_name_user_match in roles) - - def authorize(self, req): - env = req.environ - env_identity = env.get('keystone.identity', {}) - tenant_id, tenant_name = env_identity.get('tenant') - user = env_identity.get('user', '') + tenant_match = [tenant_id, '*'] + user_match = [user_id, '*'] + if allow_names: + tenant_match = tenant_match + [tenant_name] + user_match = user_match + [user_name] + for tenant in tenant_match: + for user in user_match: + s = '%s:%s' % (tenant, user) + if s in roles: + return s + return None + + def authorize(self, env_identity, req): + # Cleanup - make sure that a previously set swift_owner setting is + # cleared now. This might happen for example with COPY requests. + req.environ.pop('swift_owner', None) + + tenant_id, tenant_name = env_identity['tenant'] + user_id, user_name = env_identity['user'] referrers, roles = swift_acl.parse_acl(getattr(req, 'acl', None)) + # allow OPTIONS requests to proceed as normal + if req.method == 'OPTIONS': + return + try: - part = swift_utils.split_path(req.path, 1, 4, True) + part = req.split_path(1, 4, True) version, account, container, obj = part except ValueError: return HTTPNotFound(request=req) - user_roles = env_identity.get('roles', []) + self._set_project_domain_id(req, part, env_identity) - # Give unconditional access to a user with the reseller_admin - # role. + user_roles = [r.lower() for r in env_identity.get('roles', [])] + user_service_roles = [r.lower() for r in env_identity.get( + 'service_roles', [])] + + # Give unconditional access to a user with the reseller_admin role. if self.reseller_admin_role in user_roles: msg = 'User %s has reseller admin authorizing' - self.logger.debug(msg % tenant_id) + self.logger.debug(msg, tenant_id) req.environ['swift_owner'] = True return + # Being in system_reader_roles is almost as good as reseller_admin. + if self.system_reader_roles.intersection(user_roles): + # Note that if a system reader is trying to write, we're letting + # the request fall on other access checks below. This way, + # a compliance auditor can write a log file as a normal member. + if req.method in ('GET', 'HEAD'): + msg = 'User %s has system reader authorizing' + self.logger.debug(msg, tenant_id) + # We aren't setting 'swift_owner' nor 'reseller_request' + # because they are only ever used for something that modifies + # the contents of the cluster (setting ACL, deleting accounts). + return + + # If we are not reseller admin and user is trying to delete its own + # account then deny it. 
+ if not container and not obj and req.method == 'DELETE': + # User is not allowed to issue a DELETE on its own account + msg = 'User %s:%s is not allowed to delete its own account' + self.logger.debug(msg, tenant_name, user_name) + return self.denied_response(req) + # cross-tenant authorization - if self._authorize_cross_tenant(user, tenant_id, tenant_name, roles): - log_msg = 'user %s:%s, %s:%s, or *:%s allowed in ACL authorizing' - self.logger.debug(log_msg % (tenant_name, user, - tenant_id, user, user)) + matched_acl = None + if roles: + allow_names = self._is_name_allowed_in_acl(req, part, env_identity) + matched_acl = self._authorize_cross_tenant(user_id, user_name, + tenant_id, tenant_name, + roles, allow_names) + if matched_acl is not None: + log_msg = 'user %s allowed in ACL authorizing.' + self.logger.debug(log_msg, matched_acl) + return + + acl_authorized = self._authorize_unconfirmed_identity(req, obj, + referrers, + roles) + if acl_authorized: return # Check if a user tries to access an account that does not match their # token - if not self._reseller_check(account, tenant_id): - log_msg = 'tenant mismatch: %s != %s' % (account, tenant_id) - self.logger.debug(log_msg) + if not self._account_matches_tenant(account, tenant_id): + log_msg = 'tenant mismatch: %s != %s' + self.logger.debug(log_msg, account, tenant_id) return self.denied_response(req) - # Check the roles the user is belonging to. If the user is - # part of the role defined in the config variable - # operator_roles (like admin) then it will be - # promoted as an admin of the account/tenant. - for role in self.operator_roles.split(','): - role = role.strip() - if role in user_roles: - log_msg = 'allow user with role %s as account admin' % (role) - self.logger.debug(log_msg) - req.environ['swift_owner'] = True - return - - # If user is of the same name of the tenant then make owner of it. - if self.is_admin and user == tenant_name: + # Compare roles from tokens against the configuration options: + # + # X-Auth-Token role Has specified X-Service-Token role Grant + # in operator_roles? service_roles? in service_roles? swift_owner? + # ------------------ -------------- -------------------- ------------ + # yes yes yes yes + # yes yes no no + # yes no don't care yes + # no don't care don't care no + # ------------------ -------------- -------------------- ------------ + account_prefix = self._get_account_prefix(account) + operator_roles = self.account_rules[account_prefix]['operator_roles'] + have_operator_role = set(operator_roles).intersection( + set(user_roles)) + service_roles = self.account_rules[account_prefix]['service_roles'] + have_service_role = set(service_roles).intersection( + set(user_service_roles)) + allowed = False + if have_operator_role and (service_roles and have_service_role): + allowed = True + elif have_operator_role and not service_roles: + allowed = True + if allowed: + log_msg = 'allow user with role(s) %s as account admin' + self.logger.debug(log_msg, ','.join(have_operator_role.union( + have_service_role))) req.environ['swift_owner'] = True return - authorized = self._authorize_unconfirmed_identity(req, obj, referrers, - roles) - if authorized: - return - elif authorized is not None: + # The project_reader_roles is almost as good as operator_roles. But + # it does not work with service tokens and does not get 'swift_owner'. + # And, it only serves GET requests, obviously. 
+ project_reader_roles = self.account_rules[account_prefix][ + 'project_reader_roles'] + have_reader_role = set(project_reader_roles).intersection( + set(user_roles)) + if have_reader_role: + if req.method in ('GET', 'HEAD'): + msg = 'User %s with role(s) %s has project reader authorizing' + self.logger.debug(msg, tenant_id, + ','.join(project_reader_roles)) + return + + if acl_authorized is not None: return self.denied_response(req) # Check if we have the role in the userroles and allow it for user_role in user_roles: - if user_role in roles: + if user_role in (r.lower() for r in roles): log_msg = 'user %s:%s allowed in ACL: %s authorizing' - self.logger.debug(log_msg % (tenant_name, user, user_role)) + self.logger.debug(log_msg, tenant_name, user_name, + user_role) return return self.denied_response(req) @@ -239,13 +539,18 @@ def authorize_anonymous(self, req): :returns: None if authorization is granted, an error page otherwise. """ try: - part = swift_utils.split_path(req.path, 1, 4, True) + part = req.split_path(1, 4, True) version, account, container, obj = part except ValueError: return HTTPNotFound(request=req) + # allow OPTIONS requests to proceed as normal + if req.method == 'OPTIONS': + return + is_authoritative_authz = (account and - account.startswith(self.reseller_prefix)) + (self._get_account_prefix(account) in + self.reseller_prefixes)) if not is_authoritative_authz: return self.denied_response(req) @@ -268,15 +573,15 @@ def _authorize_unconfirmed_identity(self, req, obj, referrers, roles): and (req.environ['swift_sync_key'] == req.headers.get('x-container-sync-key', None)) and 'x-timestamp' in req.headers): - log_msg = 'allowing proxy %s for container-sync' % req.remote_addr - self.logger.debug(log_msg) + log_msg = 'allowing proxy %s for container-sync' + self.logger.debug(log_msg, req.remote_addr) return True # Check if referrer is allowed. if swift_acl.referrer_allowed(req.referer, referrers): if obj or '.rlistings' in roles: - log_msg = 'authorizing %s via referer ACL' % req.referrer - self.logger.debug(log_msg) + log_msg = 'authorizing %s via referer ACL' + self.logger.debug(log_msg, req.referrer) return True return False diff --git a/swift/common/middleware/list_endpoints.py b/swift/common/middleware/list_endpoints.py new file mode 100644 index 0000000000..edceec421e --- /dev/null +++ b/swift/common/middleware/list_endpoints.py @@ -0,0 +1,264 @@ +# Copyright (c) 2012 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +""" +List endpoints for an object, account or container. + +This middleware makes it possible to integrate swift with software +that relies on data locality information to avoid network overhead, +such as Hadoop. 
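(Illustrative, not part of the patch.) Deploying the middleware amounts to a filter section plus an entry in the proxy pipeline, along these lines; the section name is arbitrary and the commented option shows its default:

    [filter:list-endpoints]
    use = egg:swift#list_endpoints
    # list_endpoints_path = /endpoints/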
+ +Using the original API, answers requests of the form:: + + /endpoints/{account}/{container}/{object} + /endpoints/{account}/{container} + /endpoints/{account} + /endpoints/v1/{account}/{container}/{object} + /endpoints/v1/{account}/{container} + /endpoints/v1/{account} + +with a JSON-encoded list of endpoints of the form:: + + http://{server}:{port}/{dev}/{part}/{acc}/{cont}/{obj} + http://{server}:{port}/{dev}/{part}/{acc}/{cont} + http://{server}:{port}/{dev}/{part}/{acc} + +correspondingly, e.g.:: + + http://10.1.1.1:6200/sda1/2/a/c2/o1 + http://10.1.1.1:6200/sda1/2/a/c2 + http://10.1.1.1:6200/sda1/2/a + +Using the v2 API, answers requests of the form:: + + /endpoints/v2/{account}/{container}/{object} + /endpoints/v2/{account}/{container} + /endpoints/v2/{account} + +with a JSON-encoded dictionary containing a key 'endpoints' that maps to a list +of endpoints having the same form as described above, and a key 'headers' that +maps to a dictionary of headers that should be sent with a request made to +the endpoints, e.g.:: + + { "endpoints": {"http://10.1.1.1:6210/sda1/2/a/c3/o1", + "http://10.1.1.1:6230/sda3/2/a/c3/o1", + "http://10.1.1.1:6240/sda4/2/a/c3/o1"}, + "headers": {"X-Backend-Storage-Policy-Index": "1"}} + +In this example, the 'headers' dictionary indicates that requests to the +endpoint URLs should include the header 'X-Backend-Storage-Policy-Index: 1' +because the object's container is using storage policy index 1. + +The '/endpoints/' path is customizable ('list_endpoints_path' +configuration parameter). + +Intended for consumption by third-party services living inside the +cluster (as the endpoints make sense only inside the cluster behind +the firewall); potentially written in a different language. + +This is why it's provided as a REST API and not just a Python API: +to avoid requiring clients to write their own ring parsers in their +languages, and to avoid the necessity to distribute the ring file +to clients and keep it up-to-date. + +Note that the call is not authenticated, which means that a proxy +with this middleware enabled should not be open to an untrusted +environment (everyone can query the locality data using this middleware). +""" + +import json + +from urllib.parse import quote, unquote + +from swift.common.ring import Ring +from swift.common.utils import get_logger, split_path +from swift.common.swob import Request, Response +from swift.common.swob import HTTPBadRequest, HTTPMethodNotAllowed +from swift.common.storage_policy import POLICIES +from swift.proxy.controllers.base import get_container_info + +RESPONSE_VERSIONS = (1.0, 2.0) + + +class ListEndpointsMiddleware(object): + """ + List endpoints for an object, account or container. + + See above for a full description. + + Uses configuration parameter `swift_dir` (default `/etc/swift`). + + :param app: The next WSGI filter or app in the paste.deploy + chain. + :param conf: The configuration dict for the middleware. 
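As a hypothetical consumer of the v2 listing described above (the proxy address and the account/container/object names are invented):

    import json
    from urllib.request import urlopen

    # Ask the proxy where the replicas of AUTH_test/jobs/part-0001 live.
    url = 'http://127.0.0.1:8080/endpoints/v2/AUTH_test/jobs/part-0001'
    with urlopen(url) as resp:
        info = json.load(resp)
    for endpoint in info['endpoints']:
        # A locality-aware scheduler can prefer the nodes named here, passing
        # info['headers'] along with any direct request to them.
        print(endpoint, info['headers'])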
+ """ + + def __init__(self, app, conf): + self.app = app + self.logger = get_logger(conf, log_route='endpoints') + self.swift_dir = conf.get('swift_dir', '/etc/swift') + self.account_ring = Ring(self.swift_dir, ring_name='account') + self.container_ring = Ring(self.swift_dir, ring_name='container') + self.endpoints_path = conf.get('list_endpoints_path', '/endpoints/') + if not self.endpoints_path.endswith('/'): + self.endpoints_path += '/' + self.default_response_version = 1.0 + self.response_map = { + 1.0: self.v1_format_response, + 2.0: self.v2_format_response, + } + + def get_object_ring(self, policy_idx): + """ + Get the ring object to use to handle a request based on its policy. + + :policy_idx: policy index as defined in swift.conf + :returns: appropriate ring object + """ + return POLICIES.get_object_ring(policy_idx, self.swift_dir) + + def _parse_version(self, raw_version): + err_msg = 'Unsupported version %r' % raw_version + try: + version = float(raw_version.lstrip('v')) + except ValueError: + raise ValueError(err_msg) + if not any(version == v for v in RESPONSE_VERSIONS): + raise ValueError(err_msg) + return version + + def _parse_path(self, request): + """ + Parse path parts of request into a tuple of version, account, + container, obj. Unspecified container or obj is filled in as + None; account is required; version is always returned as a + float using the configured default response version if not + specified in the request. + + :param request: the swob request + + :returns: parsed path parts as a tuple with version filled in as + configured default response version if not specified. + :raises ValueError: if path is invalid, message will say why. + """ + clean_path = request.path[len(self.endpoints_path) - 1:] + # try to peel off version + try: + raw_version, rest = split_path(clean_path, 1, 2, True) + except ValueError: + raise ValueError('No account specified') + try: + version = self._parse_version(raw_version) + except ValueError: + if raw_version.startswith('v') and '_' not in raw_version: + # looks more like an invalid version than an account + raise + # probably no version specified, but if the client really + # said /endpoints/v_3/account they'll probably be sorta + # confused by the useless response and lack of error. 
+ version = self.default_response_version + rest = clean_path + else: + rest = '/' + rest if rest else '/' + try: + account, container, obj = split_path(rest, 1, 3, True) + except ValueError: + raise ValueError('No account specified') + return version, account, container, obj + + def v1_format_response(self, req, endpoints, **kwargs): + return Response(json.dumps(endpoints), + content_type='application/json') + + def v2_format_response(self, req, endpoints, storage_policy_index, + **kwargs): + resp = { + 'endpoints': endpoints, + 'headers': {}, + } + if storage_policy_index is not None: + resp['headers'][ + 'X-Backend-Storage-Policy-Index'] = str(storage_policy_index) + return Response(json.dumps(resp), + content_type='application/json') + + def __call__(self, env, start_response): + request = Request(env) + if not request.path.startswith(self.endpoints_path): + return self.app(env, start_response) + + if request.method != 'GET': + return HTTPMethodNotAllowed( + req=request, headers={"Allow": "GET"})(env, start_response) + + try: + version, account, container, obj = self._parse_path(request) + except ValueError as err: + return HTTPBadRequest(str(err))(env, start_response) + + account = unquote(account) + if container is not None: + container = unquote(container) + if obj is not None: + obj = unquote(obj) + + storage_policy_index = None + if obj is not None: + container_info = get_container_info( + {'PATH_INFO': '/v1/%s/%s' % (account, container)}, + self.app, swift_source='LE') + storage_policy_index = container_info['storage_policy'] + obj_ring = self.get_object_ring(storage_policy_index) + partition, nodes = obj_ring.get_nodes( + account, container, obj) + endpoint_template = 'http://{ip}:{port}/{device}/{partition}/' + \ + '{account}/{container}/{obj}' + elif container is not None: + partition, nodes = self.container_ring.get_nodes( + account, container) + endpoint_template = 'http://{ip}:{port}/{device}/{partition}/' + \ + '{account}/{container}' + else: + partition, nodes = self.account_ring.get_nodes( + account) + endpoint_template = 'http://{ip}:{port}/{device}/{partition}/' + \ + '{account}' + + endpoints = [] + for node in nodes: + endpoint = endpoint_template.format( + ip=node['ip'], + port=node['port'], + device=node['device'], + partition=partition, + account=quote(account), + container=quote(container or ''), + obj=quote(obj or '')) + endpoints.append(endpoint) + + resp = self.response_map[version]( + request, endpoints=endpoints, + storage_policy_index=storage_policy_index) + return resp(env, start_response) + + +def filter_factory(global_conf, **local_conf): + conf = global_conf.copy() + conf.update(local_conf) + + def list_endpoints_filter(app): + return ListEndpointsMiddleware(app, conf) + + return list_endpoints_filter diff --git a/swift/common/middleware/listing_formats.py b/swift/common/middleware/listing_formats.py new file mode 100644 index 0000000000..290a73152a --- /dev/null +++ b/swift/common/middleware/listing_formats.py @@ -0,0 +1,265 @@ +# Copyright (c) 2017 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. 
+# See the License for the specific language governing permissions and +# limitations under the License. + +import json +from xml.etree.cElementTree import Element, SubElement, tostring + +from swift.common.constraints import valid_api_version +from swift.common.header_key_dict import HeaderKeyDict +from swift.common.http import HTTP_NO_CONTENT +from swift.common.request_helpers import get_param +from swift.common.swob import HTTPException, HTTPNotAcceptable, Request, \ + RESPONSE_REASONS, HTTPBadRequest, wsgi_quote, wsgi_to_bytes +from swift.common.utils import RESERVED, get_logger, list_from_csv + + +#: Mapping of query string ``format=`` values to their corresponding +#: content-type values. +FORMAT2CONTENT_TYPE = {'plain': 'text/plain', 'json': 'application/json', + 'xml': 'application/xml'} +#: Maximum size of a valid JSON container listing body. If we receive +#: a container listing response larger than this, assume it's a staticweb +#: response and pass it on to the client. +# Default max object length is 1024, default container listing limit is 1e4; +# add a fudge factor for things like hash, last_modified, etc. +MAX_CONTAINER_LISTING_CONTENT_LENGTH = 1024 * 10000 * 2 + + +def get_listing_content_type(req): + """ + Determine the content type to use for an account or container listing + response. + + :param req: request object + :returns: content type as a string (e.g. text/plain, application/json) + :raises HTTPNotAcceptable: if the requested content type is not acceptable + :raises HTTPBadRequest: if the 'format' query param is provided and + not valid UTF-8 + """ + query_format = get_param(req, 'format') + if query_format: + req.accept = FORMAT2CONTENT_TYPE.get( + query_format.lower(), FORMAT2CONTENT_TYPE['plain']) + try: + out_content_type = req.accept.best_match( + ['text/plain', 'application/json', 'application/xml', 'text/xml']) + except ValueError: + raise HTTPBadRequest(request=req, body=b'Invalid Accept header') + if not out_content_type: + raise HTTPNotAcceptable(request=req) + return out_content_type + + +def to_xml(document_element): + result = tostring(document_element, encoding='UTF-8').replace( + b"", + b'', 1) + if not result.startswith(b'\n' + result + return result + + +def account_to_xml(listing, account_name): + doc = Element('account', name=account_name) + doc.text = '\n' + for record in listing: + if 'subdir' in record: + name = record.pop('subdir') + sub = SubElement(doc, 'subdir', name=name) + else: + sub = SubElement(doc, 'container') + for field in ('name', 'count', 'bytes', 'last_modified'): + SubElement(sub, field).text = str(record.pop(field)) + for field in ('storage_policy',): + if field in record: + SubElement(sub, field).text = str(record.pop(field)) + sub.tail = '\n' + return to_xml(doc) + + +def container_to_xml(listing, base_name): + doc = Element('container', name=base_name) + for record in listing: + if 'subdir' in record: + name = record.pop('subdir') + sub = SubElement(doc, 'subdir', name=name) + SubElement(sub, 'name').text = name + else: + sub = SubElement(doc, 'object') + for field in ('name', 'hash', 'bytes', 'content_type', + 'last_modified'): + SubElement(sub, field).text = str(record.pop(field)) + return to_xml(doc) + + +def listing_to_text(listing): + def get_lines(): + for item in listing: + if 'name' in item: + yield item['name'].encode('utf-8') + b'\n' + else: + yield item['subdir'].encode('utf-8') + b'\n' + return b''.join(get_lines()) + + +class ListingFilter(object): + def __init__(self, app, conf, logger=None): + self.app = app 
+ self.logger = logger or get_logger(conf, log_route='listing-filter') + + def filter_reserved(self, listing, account, container): + new_listing = [] + for entry in list(listing): + for key in ('name', 'subdir'): + value = entry.get(key, '') + if RESERVED in value: + if container: + self.logger.warning( + 'Container listing for %s/%s had ' + 'reserved byte in %s: %r', + wsgi_quote(account), wsgi_quote(container), + key, value) + else: + self.logger.warning( + 'Account listing for %s had ' + 'reserved byte in %s: %r', + wsgi_quote(account), key, value) + break # out of the *key* loop; check next entry + else: + new_listing.append(entry) + return new_listing + + def __call__(self, env, start_response): + req = Request(env) + try: + # account and container only + version, acct, cont = req.split_path(2, 3) + except ValueError: + is_account_or_container_req = False + else: + is_account_or_container_req = True + if not is_account_or_container_req: + return self.app(env, start_response) + + if not valid_api_version(version) or req.method not in ('GET', 'HEAD'): + return self.app(env, start_response) + + # OK, definitely have an account/container request. + # Get the desired content-type, then force it to a JSON request. + try: + out_content_type = get_listing_content_type(req) + except HTTPException as err: + return err(env, start_response) + + params = req.params + can_vary = 'format' not in params + params['format'] = 'json' + req.params = params + + # Give other middlewares a chance to be in charge + env.setdefault('swift.format_listing', True) + status, headers, resp_iter = req.call_application(self.app) + if not env.get('swift.format_listing'): + start_response(status, headers) + return resp_iter + + if not status.startswith(('200 ', '204 ')): + start_response(status, headers) + return resp_iter + + headers_dict = HeaderKeyDict(headers) + resp_content_type = headers_dict.get( + 'content-type', '').partition(';')[0] + resp_length = headers_dict.get('content-length') + + if can_vary: + if 'vary' in headers_dict: + value = headers_dict['vary'] + if 'accept' not in list_from_csv(value.lower()): + headers_dict['vary'] = value + ', Accept' + else: + headers_dict['vary'] = 'Accept' + + if resp_content_type != 'application/json': + start_response(status, list(headers_dict.items())) + return resp_iter + + if req.method == 'HEAD': + headers_dict['content-type'] = out_content_type + '; charset=utf-8' + # proxy logging (and maybe other mw?) seem to be good about + # sticking this on HEAD/204 but we do it here to be responsible + # and explicit + headers_dict['content-length'] = 0 + start_response(status, list(headers_dict.items())) + return resp_iter + + if resp_length is None or \ + int(resp_length) > MAX_CONTAINER_LISTING_CONTENT_LENGTH: + start_response(status, list(headers_dict.items())) + return resp_iter + + body = b''.join(resp_iter) + try: + listing = json.loads(body) + # Do a couple sanity checks + if not isinstance(listing, list): + raise ValueError + if not all(isinstance(item, dict) for item in listing): + raise ValueError + except ValueError: + # Static web listing that's returning invalid JSON? + # Just pass it straight through; that's about all we *can* do. 
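# For reference (annotation, not part of the patch; field values are made
# up): a listing body that passes the sanity checks above is a JSON array of
# dicts, roughly
#     [{"name": "obj1", "hash": "d41d8cd9...", "bytes": 0,
#       "content_type": "text/plain",
#       "last_modified": "2024-01-01T00:00:00.000000"},
#      {"subdir": "photos/"}]
# Anything else -- a bare object, a string, a list of non-dicts -- is passed
# through untouched on the assumption that staticweb or similar middleware
# generated it.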
+ start_response(status, list(headers_dict.items())) + return [body] + + if not req.allow_reserved_names: + listing = self.filter_reserved(listing, acct, cont) + + try: + if out_content_type.endswith('/xml'): + if cont: + body = container_to_xml( + listing, wsgi_to_bytes(cont).decode('utf-8')) + else: + body = account_to_xml( + listing, wsgi_to_bytes(acct).decode('utf-8')) + elif out_content_type == 'text/plain': + body = listing_to_text(listing) + else: + body = json.dumps(listing).encode('ascii') + except KeyError: + # listing was in a bad format -- funky static web listing?? + start_response(status, list(headers_dict.items())) + return [body] + + if not body: + status = '%s %s' % (HTTP_NO_CONTENT, + RESPONSE_REASONS[HTTP_NO_CONTENT][0]) + + headers_dict['content-type'] = out_content_type + '; charset=utf-8' + headers_dict['content-length'] = len(body) + start_response(status, list(headers_dict.items())) + return [body] + + +def filter_factory(global_conf, **local_conf): + conf = global_conf.copy() + conf.update(local_conf) + + def listing_filter(app): + return ListingFilter(app, conf) + return listing_filter diff --git a/swift/common/middleware/memcache.py b/swift/common/middleware/memcache.py index 13e16d4c68..1bb142657d 100644 --- a/swift/common/middleware/memcache.py +++ b/swift/common/middleware/memcache.py @@ -1,4 +1,4 @@ -# Copyright (c) 2010-2012 OpenStack, LLC. +# Copyright (c) 2010-2012 OpenStack Foundation # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. @@ -13,10 +13,8 @@ # See the License for the specific language governing permissions and # limitations under the License. -import os -from ConfigParser import ConfigParser, NoSectionError, NoOptionError - -from swift.common.memcached import MemcacheRing +from swift.common.memcached import load_memcache +from swift.common.utils import get_logger class MemcacheMiddleware(object): @@ -26,39 +24,8 @@ class MemcacheMiddleware(object): def __init__(self, app, conf): self.app = app - self.memcache_servers = conf.get('memcache_servers') - serialization_format = conf.get('memcache_serialization_support') - - if not self.memcache_servers or serialization_format is None: - path = os.path.join(conf.get('swift_dir', '/etc/swift'), - 'memcache.conf') - memcache_conf = ConfigParser() - if memcache_conf.read(path): - if not self.memcache_servers: - try: - self.memcache_servers = \ - memcache_conf.get('memcache', 'memcache_servers') - except (NoSectionError, NoOptionError): - pass - if serialization_format is None: - try: - serialization_format = \ - memcache_conf.get('memcache', - 'memcache_serialization_support') - except (NoSectionError, NoOptionError): - pass - - if not self.memcache_servers: - self.memcache_servers = '127.0.0.1:11211' - if serialization_format is None: - serialization_format = 2 - else: - serialization_format = int(serialization_format) - - self.memcache = MemcacheRing( - [s.strip() for s in self.memcache_servers.split(',') if s.strip()], - allow_pickle=(serialization_format == 0), - allow_unpickle=(serialization_format <= 1)) + self.logger = get_logger(conf, log_route='memcache') + self.memcache = load_memcache(conf, self.logger) def __call__(self, env, start_response): env['swift.cache'] = self.memcache diff --git a/swift/common/middleware/name_check.py b/swift/common/middleware/name_check.py index 39411690c9..b13c5a76bd 100644 --- a/swift/common/middleware/name_check.py +++ b/swift/common/middleware/name_check.py @@ -1,4 +1,4 @@ -# 
Copyright (c) 2012 OpenStack, LLC. +# Copyright (c) 2012 OpenStack Foundation # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. @@ -15,14 +15,17 @@ ''' Created on February 27, 2012 -A filter that disallows any paths that contain defined forbidden characters -or that exceed a defined length. +A filter that disallows any paths that contain defined forbidden characters or +that exceed a defined length. -Place in proxy filter before proxy, e.g. +Place early in the proxy-server pipeline after the left-most occurrence of the +``proxy-logging`` middleware (if present) and before the final +``proxy-logging`` middleware (if present) or the ``proxy-serer`` app itself, +e.g.:: [pipeline:main] - pipeline = catch_errors healthcheck name_check cache ratelimit tempauth sos - proxy-logging proxy-server + pipeline = catch_errors healthcheck proxy-logging name_check cache \ +ratelimit tempauth sos proxy-logging proxy-server [filter:name_check] use = egg:swift#name_check @@ -39,14 +42,14 @@ import re from swift.common.utils import get_logger -from urllib2 import unquote +from swift.common.registry import register_swift_info from swift.common.swob import Request, HTTPBadRequest FORBIDDEN_CHARS = "\'\"`<>" MAX_LENGTH = 255 -FORBIDDEN_REGEXP = "/\./|/\.\./|/\.$|/\.\.$" +FORBIDDEN_REGEXP = r"/\./|/\.\./|/\.$|/\.\.$" class NameCheckMiddleware(object): @@ -56,7 +59,7 @@ def __init__(self, app, conf): self.conf = conf self.forbidden_chars = self.conf.get('forbidden_chars', FORBIDDEN_CHARS) - self.maximum_length = self.conf.get('maximum_length', MAX_LENGTH) + self.maximum_length = int(self.conf.get('maximum_length', MAX_LENGTH)) self.forbidden_regexp = self.conf.get('forbidden_regexp', FORBIDDEN_REGEXP) if self.forbidden_regexp: @@ -65,6 +68,15 @@ def __init__(self, app, conf): self.forbidden_regexp_compiled = None self.logger = get_logger(self.conf, log_route='name_check') + self.register_info() + + def register_info(self): + register_swift_info('name_check', + forbidden_chars=self.forbidden_chars, + maximum_length=self.maximum_length, + forbidden_regexp=self.forbidden_regexp + ) + def check_character(self, req): ''' Checks req.path for any forbidden characters @@ -75,12 +87,7 @@ def check_character(self, req): self.logger.debug("name_check: self.forbidden_chars %s" % self.forbidden_chars) - for c in unquote(req.path): - if c in self.forbidden_chars: - return True - else: - pass - return False + return any((c in req.path_info) for c in self.forbidden_chars) def check_length(self, req): ''' @@ -88,11 +95,8 @@ def check_length(self, req): Returns True if the length exceeds the maximum Returns False if the length is <= the maximum ''' - length = len(unquote(req.path)) - if length > self.maximum_length: - return True - else: - return False + length = len(req.path_info) + return length > self.maximum_length def check_regexp(self, req): ''' @@ -107,8 +111,7 @@ def check_regexp(self, req): self.logger.debug("name_check: self.forbidden_regexp %s" % self.forbidden_regexp) - unquoted_path = unquote(req.path) - match = self.forbidden_regexp_compiled.search(unquoted_path) + match = self.forbidden_regexp_compiled.search(req.path_info) return (match is not None) def __call__(self, env, start_response): @@ -117,18 +120,20 @@ def __call__(self, env, start_response): if self.check_character(req): return HTTPBadRequest( request=req, - body=("Object/Container name contains forbidden chars from %s" + body=("Object/Container/Account name contains 
forbidden " + "chars from %s" % self.forbidden_chars))(env, start_response) elif self.check_length(req): return HTTPBadRequest( request=req, - body=("Object/Container name longer than the allowed maximum " + body=("Object/Container/Account name longer than the " + "allowed maximum " "%s" % self.maximum_length))(env, start_response) elif self.check_regexp(req): return HTTPBadRequest( request=req, - body=("Object/Container name contains a forbidden substring " - "from regular expression %s" + body=("Object/Container/Account name contains a forbidden " + "substring from regular expression %s" % self.forbidden_regexp))(env, start_response) else: # Pass on to downstream WSGI component diff --git a/swift/common/middleware/proxy_logging.py b/swift/common/middleware/proxy_logging.py index a63e10436f..5fc46b9715 100644 --- a/swift/common/middleware/proxy_logging.py +++ b/swift/common/middleware/proxy_logging.py @@ -1,4 +1,4 @@ -# Copyright (c) 2010-2011 OpenStack, LLC. +# Copyright (c) 2010-2011 OpenStack Foundation # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. @@ -19,70 +19,170 @@ This serves as both the default logging implementation and an example of how to plug in your own logging format/method. -The logging format implemented below is as follows: +The logging format implemented below is as follows:: -client_ip remote_addr datetime request_method request_path protocol - status_int referer user_agent auth_token bytes_recvd bytes_sent - client_etag transaction_id headers request_time source + client_ip remote_addr end_time.datetime method path protocol + status_int referer user_agent auth_token bytes_recvd bytes_sent + client_etag transaction_id headers request_time source log_info + start_time end_time policy_index These values are space-separated, and each is url-encoded, so that they can -be separated with a simple .split() +be separated with a simple ``.split()``. -* remote_addr is the contents of the REMOTE_ADDR environment variable, while - client_ip is swift's best guess at the end-user IP, extracted variously - from the X-Forwarded-For header, X-Cluster-Ip header, or the REMOTE_ADDR - environment variable. +* ``remote_addr`` is the contents of the REMOTE_ADDR environment variable, + while ``client_ip`` is swift's best guess at the end-user IP, extracted + variously from the X-Forwarded-For header, X-Cluster-Ip header, or the + REMOTE_ADDR environment variable. + +* ``status_int`` is the integer part of the ``status`` string passed to this + middleware's start_response function, unless the WSGI environment has an item + with key ``swift.proxy_logging_status``, in which case the value of that item + is used. Other middleware's may set ``swift.proxy_logging_status`` to + override the logging of ``status_int``. In either case, the logged + ``status_int`` value is forced to 499 if a client disconnect is detected + while this middleware is handling a request, or 500 if an exception is caught + while handling a request. + +* ``source`` (``swift.source`` in the WSGI environment) indicates the code + that generated the request, such as most middleware. (See below for + more detail.) + +* ``log_info`` (``swift.log_info`` in the WSGI environment) is for additional + information that could prove quite useful, such as any ``x-delete-at`` + value or other "behind the scenes" activity that might not + otherwise be detectable from the plain log information. 
Code that + wishes to add additional log information should use code like + ``env.setdefault('swift.log_info', []).append(your_info)`` so as to + not disturb others' log information. * Values that are missing (e.g. due to a header not being present) or zero are generally represented by a single hyphen ('-'). + +.. note:: + The message format may be configured using the ``log_msg_template`` option, + allowing fields to be added, removed, re-ordered, and even anonymized. For + more information, see https://docs.openstack.org/swift/latest/logs.html + +The proxy-logging can be used twice in the proxy server's pipeline when there +is middleware installed that can return custom responses that don't follow the +standard pipeline to the proxy server. + +For example, with staticweb, the middleware might intercept a request to +/v1/AUTH_acc/cont/, make a subrequest to the proxy to retrieve +/v1/AUTH_acc/cont/index.html and, in effect, respond to the client's original +request using the 2nd request's body. In this instance the subrequest will be +logged by the rightmost middleware (with a ``swift.source`` set) and the +outgoing request (with body overridden) will be logged by leftmost middleware. + +Requests that follow the normal pipeline (use the same wsgi environment +throughout) will not be double logged because an environment variable +(``swift.proxy_access_log_made``) is checked/set when a log is made. + +All middleware making subrequests should take care to set ``swift.source`` when +needed. With the doubled proxy logs, any consumer/processor of swift's proxy +logs should look at the ``swift.source`` field, the rightmost log value, to +decide if this is a middleware subrequest or not. A log processor calculating +bandwidth usage will want to only sum up logs with no ``swift.source``. """ +import os import time -from urllib import quote, unquote +from collections import ChainMap +from swift.common.constraints import valid_api_version +from swift.common.middleware.catch_errors import ByteEnforcer +from swift.common.middleware.s3api.utils import extract_bucket_and_key, \ + is_s3_req +from swift.common.request_helpers import get_log_info from swift.common.swob import Request from swift.common.utils import (get_logger, get_remote_client, - get_valid_utf8_str, config_true_value) + config_true_value, reiterate, + close_if_possible, cap_length, + InputProxy, list_from_csv, + get_policy_index, LogStringFormatter, + split_path, StrAnonymizer, StrFormatTime) +from swift.common.statsd_client import get_labeled_statsd_client + +from swift.common.storage_policy import POLICIES +from swift.common.registry import get_sensitive_headers, \ + get_sensitive_params, register_sensitive_header + + +def statsd_metric_resp_labels(base_labels, status_int=None, policy_index=None): + # compose labels used for response metrics + extra_labels = {} + if policy_index is not None: + extra_labels['policy'] = policy_index + if status_int: + extra_labels['status'] = status_int + labels_source = ChainMap(extra_labels, base_labels) + return labels_source -class InputProxy(object): +class CallbackInputProxy(InputProxy): """ - File-like object that counts bytes read. - To be swapped in for wsgi.input for accounting purposes. + :param wsgi_input: file-like object to be wrapped + :param callback: a function or a callable that + accept args (chunk, eof), + and returns chunk or a modified chunk. + eof is ``True`` if there are no more bytes to + read from the wrapped input, ``False`` otherwise. 
""" - def __init__(self, wsgi_input): - """ - :param wsgi_input: file-like object to wrap the functionality of - """ - self.wsgi_input = wsgi_input - self.bytes_received = 0 - self.client_disconnect = False + def __init__(self, wsgi_input, callback): + super().__init__(wsgi_input) + self.callback = callback - def read(self, *args, **kwargs): - """ - Pass read request to the underlying file-like object and - add bytes read to total. - """ - try: - chunk = self.wsgi_input.read(*args, **kwargs) - except Exception: - self.client_disconnect = True - raise - self.bytes_received += len(chunk) - return chunk + def chunk_update(self, chunk, eof, *arg, **kwargs): + return self.callback(chunk, eof) - def readline(self, *args, **kwargs): - """ - Pass readline request to the underlying file-like object and - add bytes read to total. + +class BufferXferEmitCallback(object): + def __init__(self, metric_name, labels, statsd, + emit_buffer_xfer_bytes_sec): + self.metric_name = metric_name + self.labels = labels + self.statsd = statsd + self.emit_buffer_xfer_bytes_sec = emit_buffer_xfer_bytes_sec + self.emit_bytes = 0 + self.next_emit_time = 0 + if self.emit_buffer_xfer_bytes_sec > 0: + self.next_emit_time = (time.time() + + self.emit_buffer_xfer_bytes_sec) + + def __call__(self, buffer, eof=False): + self._maybe_emit_stat(buffer, eof) + return buffer + + def _maybe_emit_stat(self, buffer, eof=False): """ - try: - line = self.wsgi_input.readline(*args, **kwargs) - except Exception: - self.client_disconnect = True - raise - self.bytes_received += len(line) - return line + Accumulate the length of ``buffer`` and periodically emit a stat + with the accumulated length. + + :param buffer: the buffer that has been read. + :param eof: if True, a stat is emitted immediately; otherwise a + stat will be emitted when ``next_emit_time`` has been reached. + """ + + if self.emit_buffer_xfer_bytes_sec < 0: + return + buffer_len = len(buffer) + self.emit_bytes += buffer_len + if not self.labels.get('account', None): + # tolerate no account, maybe it'll be there in time for next stat + return + + now = time.time() + if eof is False and self.next_emit_time > now: + return + + if self.emit_bytes != 0: + self.statsd.update_stats( + self.metric_name, + self.emit_bytes, + labels=self.labels, + ) + self.emit_bytes = 0 + self.next_emit_time = (now + self.emit_buffer_xfer_bytes_sec) class ProxyLoggingMiddleware(object): @@ -90,9 +190,29 @@ class ProxyLoggingMiddleware(object): Middleware that logs Swift proxy requests in the swift log format. """ - def __init__(self, app, conf): + def __init__(self, app, conf, logger=None): self.app = app - self.log_hdrs = config_true_value(conf.get('log_headers', 'no')) + self.pid = os.getpid() + self.log_formatter = LogStringFormatter(default='-', quote=True) + self.log_msg_template = conf.get( + 'log_msg_template', ( + '{client_ip} {remote_addr} {end_time.datetime} {method} ' + '{path} {protocol} {status_int} {referer} {user_agent} ' + '{auth_token} {bytes_recvd} {bytes_sent} {client_etag} ' + '{transaction_id} {headers} {request_time} {source} ' + '{log_info} {start_time} {end_time} {policy_index} ' + '{access_user_id}')) + # The salt is only used in StrAnonymizer. This class requires bytes, + # convert it now to prevent useless convertion later. 
+ self.anonymization_method = conf.get('log_anonymization_method', 'md5') + self.anonymization_salt = conf.get('log_anonymization_salt', '') + self.storage_domains = list_from_csv(conf.get('storage_domain', '')) + self.log_hdrs = config_true_value(conf.get( + 'access_log_headers', + conf.get('log_headers', 'no'))) + log_hdrs_only = list_from_csv(conf.get( + 'access_log_headers_only', '')) + self.log_hdrs_only = [x.title() for x in log_hdrs_only] # The leading access_* check is in case someone assumes that # log_statsd_valid_http_methods behaves like the other log_statsd_* @@ -100,135 +220,483 @@ def __init__(self, app, conf): self.valid_methods = conf.get( 'access_log_statsd_valid_http_methods', conf.get('log_statsd_valid_http_methods', - 'GET,HEAD,POST,PUT,DELETE,COPY,OPTIONS')) + 'GET,HEAD,POST,PUT,DELETE,COPY,OPTIONS,UPDATE')) self.valid_methods = [m.strip().upper() for m in self.valid_methods.split(',') if m.strip()] + + # Copy supported access_log_* options to the corresponding log_* + # option, possibly overriding the log_* option. Note that this includes + # some statsd options that have access_log_* or log_* prefixes. access_log_conf = {} for key in ('log_facility', 'log_name', 'log_level', 'log_udp_host', 'log_udp_port', 'log_statsd_host', 'log_statsd_port', 'log_statsd_default_sample_rate', + 'log_statsd_sample_rate_factor', 'log_statsd_metric_prefix'): value = conf.get('access_' + key, conf.get(key, None)) if value: access_log_conf[key] = value - self.access_logger = get_logger(access_log_conf, - log_route='proxy-access') - self.access_logger.set_statsd_prefix('proxy-server') + for key, value in conf.items(): + if key.startswith('statsd_'): + access_log_conf[key] = value + self.access_logger = logger or get_logger( + access_log_conf, + log_route=conf.get('access_log_route', 'proxy-access'), + statsd_tail_prefix='proxy-server') + self.statsd = get_labeled_statsd_client( + access_log_conf, self.access_logger.logger) + self.reveal_sensitive_prefix = int( + conf.get('reveal_sensitive_prefix', 16)) + self.check_log_msg_template_validity() + self.emit_buffer_xfer_bytes_sec = float( + conf.get('statsd_emit_buffer_xfer_bytes_seconds', -1)) + + def check_log_msg_template_validity(self): + replacements = { + # Time information + 'end_time': StrFormatTime(1000001), + 'start_time': StrFormatTime(1000000), + # Information worth to anonymize + 'client_ip': StrAnonymizer('1.2.3.4', self.anonymization_method, + self.anonymization_salt), + 'remote_addr': StrAnonymizer('4.3.2.1', self.anonymization_method, + self.anonymization_salt), + 'domain': StrAnonymizer('', self.anonymization_method, + self.anonymization_salt), + 'path': StrAnonymizer('/', self.anonymization_method, + self.anonymization_salt), + 'referer': StrAnonymizer('ref', self.anonymization_method, + self.anonymization_salt), + 'user_agent': StrAnonymizer('swift', self.anonymization_method, + self.anonymization_salt), + 'headers': StrAnonymizer('header', self.anonymization_method, + self.anonymization_salt), + 'client_etag': StrAnonymizer('etag', self.anonymization_method, + self.anonymization_salt), + 'account': StrAnonymizer('a', self.anonymization_method, + self.anonymization_salt), + 'container': StrAnonymizer('c', self.anonymization_method, + self.anonymization_salt), + 'object': StrAnonymizer('', self.anonymization_method, + self.anonymization_salt), + # Others information + 'method': 'GET', + 'protocol': '', + 'status_int': '0', + 'auth_token': '1234...', # nosec B105 + 'bytes_recvd': '1', + 'bytes_sent': '0', + 
'transaction_id': 'tx1234', + 'request_time': '0.05', + 'source': '', + 'log_info': '', + 'policy_index': '', + 'ttfb': '0.05', + 'pid': '42', + 'wire_status_int': '200', + 'access_user_id': StrAnonymizer('AKIAIOSFODNN7EXAMPLE', + self.anonymization_method, + self.anonymization_salt), + } + try: + self.log_formatter.format(self.log_msg_template, **replacements) + except Exception as e: + raise ValueError('Cannot interpolate log_msg_template: %s' % e) + + def method_from_req(self, req): + return req.environ.get('swift.orig_req_method', req.method) + + def req_already_logged(self, env): + return env.get('swift.proxy_access_log_made') + + def mark_req_logged(self, env): + env['swift.proxy_access_log_made'] = True + + def obscure_sensitive(self, value): + return cap_length(value, self.reveal_sensitive_prefix) + + def obscure_req(self, req): + for header in get_sensitive_headers(): + if header in req.headers: + req.headers[header] = \ + self.obscure_sensitive(req.headers[header]) + + obscure_params = get_sensitive_params() + new_params = [] + any_obscured = False + for k, v in req.params.items(): + if k in obscure_params: + new_params.append((k, self.obscure_sensitive(v))) + any_obscured = True + else: + new_params.append((k, v)) + if any_obscured: + req.params = new_params + + def get_access_user_id(self, req): + """ + Get access user ID from request environ. + + :param req: swob.Request object for the request + :returns: User ID for logging if available, None otherwise + """ + return req.environ.get('swift.access_logging', {}).get('user_id') - def log_request(self, env, status_int, bytes_received, bytes_sent, - request_time, client_disconnect): + def log_request(self, req, status_int, bytes_received, bytes_sent, + start_time, end_time, resp_headers=None, ttfb=0, + wire_status_int=None): """ Log a request. - :param env: WSGI environment + :param req: swob.Request object for the request :param status_int: integer code for the response status :param bytes_received: bytes successfully read from the request body :param bytes_sent: bytes yielded to the WSGI server - :param request_time: time taken to satisfy the request, in seconds + :param start_time: timestamp request started + :param end_time: timestamp request completed + :param resp_headers: dict of the response headers + :param ttfb: time to first byte + :param wire_status_int: the on the wire status int """ - req = Request(env) - if client_disconnect: # log disconnected clients as '499' status code - status_int = 499 - req_path = get_valid_utf8_str(req.path) - the_request = quote(unquote(req_path)) - if req.query_string: - the_request = the_request + '?' 
+ req.query_string + self.obscure_req(req) + domain = req.environ.get('HTTP_HOST', + req.environ.get('SERVER_NAME', None)) + if ':' in domain: + domain, port = domain.rsplit(':', 1) + resp_headers = resp_headers or {} logged_headers = None if self.log_hdrs: - logged_headers = '\n'.join('%s: %s' % (k, v) - for k, v in req.headers.items()) - method = req.environ.get('swift.orig_req_method', req.method) - self.access_logger.info(' '.join( - quote(str(x) if x else '-') - for x in ( - get_remote_client(req), - req.remote_addr, - time.strftime('%d/%b/%Y/%H/%M/%S', time.gmtime()), - method, - the_request, + if self.log_hdrs_only: + logged_headers = '\n'.join('%s: %s' % (k, v) + for k, v in req.headers.items() + if k in self.log_hdrs_only) + else: + logged_headers = '\n'.join('%s: %s' % (k, v) + for k, v in req.headers.items()) + + method = self.method_from_req(req) + duration_time_str = "%.4f" % (end_time - start_time) + policy_index = get_policy_index(req.headers, resp_headers) + + swift_path = req.environ.get('swift.backend_path', req.path) + acc, cont, obj = self.get_aco_from_path(swift_path) + + replacements = { + # Time information + 'end_time': StrFormatTime(end_time), + 'start_time': StrFormatTime(start_time), + # Information worth to anonymize + 'client_ip': StrAnonymizer(get_remote_client(req), + self.anonymization_method, + self.anonymization_salt), + 'remote_addr': StrAnonymizer(req.remote_addr, + self.anonymization_method, + self.anonymization_salt), + 'domain': StrAnonymizer(domain, self.anonymization_method, + self.anonymization_salt), + 'path': StrAnonymizer(req.path_qs, self.anonymization_method, + self.anonymization_salt), + 'referer': StrAnonymizer(req.referer, self.anonymization_method, + self.anonymization_salt), + 'user_agent': StrAnonymizer(req.user_agent, + self.anonymization_method, + self.anonymization_salt), + 'headers': StrAnonymizer(logged_headers, self.anonymization_method, + self.anonymization_salt), + 'client_etag': StrAnonymizer(req.headers.get('etag'), + self.anonymization_method, + self.anonymization_salt), + 'account': StrAnonymizer(acc, self.anonymization_method, + self.anonymization_salt), + 'container': StrAnonymizer(cont, self.anonymization_method, + self.anonymization_salt), + 'object': StrAnonymizer(obj, self.anonymization_method, + self.anonymization_salt), + # Others information + 'method': method, + 'protocol': req.environ.get('SERVER_PROTOCOL'), - status_int, - req.referer, - req.user_agent, + 'status_int': status_int, + 'auth_token': req.headers.get('x-auth-token'), - bytes_received, - bytes_sent, - req.headers.get('etag', None), - req.environ.get('swift.trans_id'), - logged_headers, - '%.4f' % request_time, - req.environ.get('swift.source'), - ))) - # Log timing and bytes-transfered data to StatsD - if req.path.startswith('/v1/'): - try: - stat_type = [None, 'account', 'container', - 'object'][req.path.strip('/').count('/')] - except IndexError: - stat_type = 'object' - else: - stat_type = env.get('swift.source') - # Only log data for valid controllers (or SOS) to keep the metric count - # down (egregious errors will get logged by the proxy server itself). 
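# Annotation (not part of the patch): the dotted StatsD names kept by the new
# code below follow the pattern <resource>.<METHOD>.<status>, so a successful
# object GET still emits, for example,
#     object.GET.200.timing
#     object.GET.200.xfer
#     object.policy.0.GET.200.timing    (when a policy index is resolved)
# while the labeled statsd client additionally emits metrics such as
# swift_proxy_server_request_timing carrying resource/method/status labels.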
- if stat_type: - stat_method = method if method in self.valid_methods \ - else 'BAD_METHOD' - metric_name = '.'.join((stat_type, stat_method, str(status_int))) - self.access_logger.timing(metric_name + '.timing', - request_time * 1000) - self.access_logger.update_stats(metric_name + '.xfer', + 'bytes_recvd': bytes_received, + 'bytes_sent': bytes_sent, + 'transaction_id': req.environ.get('swift.trans_id'), + 'request_time': duration_time_str, + 'source': req.environ.get('swift.source'), + 'log_info': get_log_info(req.environ), + 'policy_index': policy_index, + 'ttfb': ttfb, + 'pid': self.pid, + 'wire_status_int': wire_status_int or status_int, + 'access_user_id': StrAnonymizer( + self.get_access_user_id(req), self.anonymization_method, + self.anonymization_salt), + } + self.access_logger.info( + self.log_formatter.format(self.log_msg_template, + **replacements)) + + # Log timing and bytes-transferred data to StatsD + metric_method = self.statsd_metric_method(method) + metric_name = self.statsd_metric_name(req, status_int, metric_method) + metric_name_policy = self.statsd_metric_name_policy( + req, status_int, metric_method, policy_index) + + self.access_logger.timing(metric_name + '.timing', + (end_time - start_time) * 1000) + self.access_logger.update_stats(metric_name + '.xfer', + bytes_received + bytes_sent) + if metric_name_policy: + self.access_logger.timing(metric_name_policy + '.timing', + (end_time - start_time) * 1000) + self.access_logger.update_stats(metric_name_policy + '.xfer', bytes_received + bytes_sent) + labels = self.statsd_metric_labels( + req, status_int, metric_method, + acc=acc, cont=cont, policy_index=policy_index) + self.statsd.timing( + 'swift_proxy_server_request_timing', + (end_time - start_time) * 1000, + labels=labels, + ) + self.statsd.update_stats( + 'swift_proxy_server_request_body_bytes', + bytes_received, + labels=labels, + ) + self.statsd.update_stats( + 'swift_proxy_server_response_body_bytes', + bytes_sent, + labels=labels, + ) + + def get_aco_from_path(self, swift_path): + try: + version, acc, cont, obj = split_path(swift_path, 1, 4, True) + if not valid_api_version(version): + raise ValueError + except ValueError: + acc, cont, obj = None, None, None + return acc, cont, obj + + def get_resource_type_from_aco(self, req, acc, cont, obj): + if obj: + return 'object' + if cont: + return 'container' + if acc: + return 'account' + return req.environ.get('swift.source') or 'UNKNOWN' + + def get_resource_type(self, req): + swift_path = req.environ.get('swift.backend_path', req.path) + acc, cont, obj = self.get_aco_from_path(swift_path) + return self.get_resource_type_from_aco(req, acc, cont, obj) + + def statsd_metric_method(self, method): + return method if method in self.valid_methods else 'BAD_METHOD' + + def statsd_metric_name(self, req, status_int, metric_method): + resource_type = self.get_resource_type(req) + return '.'.join((resource_type, metric_method, str(status_int))) + + def update_swift_base_labels(self, req): + acc, cont, obj = self.get_aco_from_path(req.path) + base_labels = req.environ.get('swift.base_labels') + if base_labels is None: + # expected in the left-most proxy_logging instance + if acc is None and is_s3_req(req): + cont, obj = extract_bucket_and_key( + req, self.storage_domains, False) + + method = self.method_from_req(req) + metric_method = self.statsd_metric_method(method) + resource_type = self.get_resource_type_from_aco( + req, acc, cont, obj) + base_labels = { + 'method': metric_method, + } + base_labels['api'] = 'S3' if 
is_s3_req(req) else 'swift' + if resource_type != 'UNKNOWN' or not is_s3_req(req): + base_labels['resource'] = resource_type + if acc: + base_labels['account'] = acc + if cont: + base_labels['container'] = cont + req.environ['swift.base_labels'] = base_labels + elif acc: + # expected in the right-most proxy_logging instance + resource_type = self.get_resource_type_from_aco( + req, acc, cont, obj) + base_labels.setdefault('account', acc) + base_labels.setdefault('resource', resource_type) + + def statsd_metric_name_policy(self, req, status_int, metric_method, + policy_index): + if policy_index is None: + return None + resource_type = self.get_resource_type(req) + if resource_type == 'object': + # The policy may not exist + policy = POLICIES.get_by_index(policy_index) + if policy: + return '.'.join((resource_type, 'policy', str(policy_index), + metric_method, str(status_int))) + else: + return None + else: + return None + + def statsd_metric_labels(self, req, status_int, metric_method, acc=None, + cont=None, policy_index=None): + # overlay freshly derived labels onto base_labels just in case any + # changed w.r.t. base labels while the request was being handled (in + # particular, container may be different in swift.backend_path) + # TODO: remove unnecessary duplication in the overlay e.g. method, + # account + resource_type = self.get_resource_type(req) + + labels = { + 'resource': resource_type, + 'method': metric_method, + 'status': status_int, + } + if acc: + labels['account'] = acc + if cont: + labels['container'] = cont + if resource_type == 'object' and \ + policy_index is not None and \ + POLICIES.get_by_index(policy_index) is not None: + labels['policy'] = policy_index + return ChainMap(labels, req.environ['swift.base_labels']) + def __call__(self, env, start_response): + req = Request(env) + self.update_swift_base_labels(req) + + if self.req_already_logged(env): + return self.app(env, start_response) + + self.mark_req_logged(env) + start_response_args = [None] - input_proxy = InputProxy(env['wsgi.input']) + + xfer_metric_name = 'swift_proxy_server_request_body_streaming_bytes' + base_labels = req.environ.get('swift.base_labels') + + statsd_emit_callback = BufferXferEmitCallback( + xfer_metric_name, base_labels, self.statsd, + self.emit_buffer_xfer_bytes_sec) + input_proxy = CallbackInputProxy(env['wsgi.input'], + statsd_emit_callback) env['wsgi.input'] = input_proxy start_time = time.time() def my_start_response(status, headers, exc_info=None): start_response_args[0] = (status, list(headers), exc_info) + def status_int_for_logging(): + # log disconnected clients as '499' status code + if input_proxy.client_disconnect: + return 499 + return env.get('swift.proxy_logging_status') + def iter_response(iterable): - iterator = iter(iterable) - try: - chunk = iterator.next() - while not chunk: - chunk = iterator.next() - except StopIteration: - chunk = '' + iterator = reiterate(iterable) + content_length = None for h, v in start_response_args[0][1]: - if h.lower() in ('content-length', 'transfer-encoding'): + if h.lower() == 'content-length': + content_length = int(v) + break + elif h.lower() == 'transfer-encoding': break else: - if not chunk: - start_response_args[0][1].append(('content-length', '0')) - elif isinstance(iterable, list): + if isinstance(iterator, list): + content_length = sum(len(i) for i in iterator) start_response_args[0][1].append( - ('content-length', str(sum(len(i) for i in iterable)))) + ('Content-Length', str(content_length))) + + method = self.method_from_req(req) + 
if method == 'HEAD': + content_length = 0 + if content_length is not None: + iterator = ByteEnforcer(iterator, content_length) + + wire_status_int = int(start_response_args[0][0].split(' ', 1)[0]) + resp_headers = dict(start_response_args[0][1]) start_response(*start_response_args[0]) + + policy_index = get_policy_index(req.headers, resp_headers) + + # Log timing information for time-to-first-byte (GET requests only) + ttfb = 0.0 + if method == 'GET': + swift_path = req.environ.get('swift.backend_path', req.path) + acc, cont, _ = self.get_aco_from_path(swift_path) + labels = self.statsd_metric_labels( + req, wire_status_int, method, + acc=acc, cont=cont, policy_index=policy_index) + metric_name = self.statsd_metric_name( + req, wire_status_int, method) + metric_name_policy = self.statsd_metric_name_policy( + req, wire_status_int, method, policy_index) + + ttfb = time.time() - start_time + if metric_name: + self.access_logger.timing( + metric_name + '.first-byte.timing', ttfb * 1000) + if metric_name_policy: + self.access_logger.timing( + metric_name_policy + '.first-byte.timing', ttfb * 1000) + + self.statsd.timing( + 'swift_proxy_server_request_ttfb', + ttfb * 1000, + labels=labels, + ) + + resp_xfer_labels = statsd_metric_resp_labels( + base_labels, status_int=wire_status_int, + policy_index=policy_index) + bytes_sent = 0 - client_disconnect = False + statsd_emit_callback = BufferXferEmitCallback( + 'swift_proxy_server_response_body_streaming_bytes', + resp_xfer_labels, + self.statsd, self.emit_buffer_xfer_bytes_sec) try: - while chunk: + for chunk in iterator: bytes_sent += len(chunk) + statsd_emit_callback(chunk) yield chunk - chunk = iterator.next() except GeneratorExit: # generator was closed before we finished - client_disconnect = True + env['swift.proxy_logging_status'] = 499 + raise + except Exception: + env['swift.proxy_logging_status'] = 500 raise finally: - status_int = int(start_response_args[0][0].split(' ', 1)[0]) + statsd_emit_callback(b'', eof=True) + env.setdefault('swift.proxy_logging_status', wire_status_int) + status_int = status_int_for_logging() self.log_request( - env, status_int, input_proxy.bytes_received, bytes_sent, - time.time() - start_time, - client_disconnect or input_proxy.client_disconnect) + req, status_int, input_proxy.bytes_received, bytes_sent, + start_time, time.time(), resp_headers=resp_headers, + ttfb=ttfb, wire_status_int=wire_status_int) + close_if_possible(iterator) try: iterable = self.app(env, my_start_response) except Exception: + req = Request(env) + env['swift.proxy_logging_status'] = 500 + status_int = status_int_for_logging() self.log_request( - env, 500, input_proxy.bytes_received, 0, - time.time() - start_time, input_proxy.client_disconnect) + req, status_int, input_proxy.bytes_received, 0, start_time, + time.time()) raise else: return iter_response(iterable) @@ -238,6 +706,12 @@ def filter_factory(global_conf, **local_conf): conf = global_conf.copy() conf.update(local_conf) + # Normally it would be the middleware that uses the header that + # would register it, but because there could be 3rd party auth middlewares + # that use 'x-auth-token' or 'x-storage-token' we special case it here. 
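# Annotation (not part of the patch; example token is made up): headers
# registered as sensitive are not dropped from the access log, they are
# truncated by obscure_req() to reveal_sensitive_prefix characters (16 by
# default), so a value such as
#     X-Auth-Token: AUTH_tk0123456789abcdef0123456789abcdef
# is logged as something like
#     X-Auth-Token: AUTH_tk012345678...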
+ register_sensitive_header('x-auth-token') + register_sensitive_header('x-storage-token') + def proxy_logger(app): return ProxyLoggingMiddleware(app, conf) return proxy_logger diff --git a/swift/common/middleware/ratelimit.py b/swift/common/middleware/ratelimit.py index cee3e0637d..365f2dfcf2 100644 --- a/swift/common/middleware/ratelimit.py +++ b/swift/common/middleware/ratelimit.py @@ -1,3 +1,4 @@ +# Copyright (c) 2010-2013 OpenStack Foundation # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. @@ -12,14 +13,74 @@ # See the License for the specific language governing permissions and # limitations under the License. import time + import eventlet -from swift.common.utils import split_path, cache_from_env, get_logger -from swift.proxy.controllers.base import get_container_memcache_key +from swift.common.utils import cache_from_env, get_logger +from swift.common.registry import register_swift_info +from swift.proxy.controllers.base import get_account_info, get_container_info +from swift.common.constraints import valid_api_version from swift.common.memcached import MemcacheConnectionError from swift.common.swob import Request, Response +def interpret_conf_limits(conf, name_prefix, info=None): + """ + Parses general parms for rate limits looking for things that + start with the provided name_prefix within the provided conf + and returns lists for both internal use and for /info + + :param conf: conf dict to parse + :param name_prefix: prefix of config parms to look for + :param info: set to return extra stuff for /info registration + """ + conf_limits = [] + for conf_key in conf: + if conf_key.startswith(name_prefix): + cont_size = int(conf_key[len(name_prefix):]) + rate = float(conf[conf_key]) + conf_limits.append((cont_size, rate)) + + conf_limits.sort() + ratelimits = [] + conf_limits_info = list(conf_limits) + while conf_limits: + cur_size, cur_rate = conf_limits.pop(0) + if conf_limits: + next_size, next_rate = conf_limits[0] + slope = (float(next_rate) - float(cur_rate)) \ + / (next_size - cur_size) + + def new_scope(cur_size, slope, cur_rate): + # making new scope for variables + return lambda x: (x - cur_size) * slope + cur_rate + line_func = new_scope(cur_size, slope, cur_rate) + else: + line_func = lambda x: cur_rate + + ratelimits.append((cur_size, cur_rate, line_func)) + if info is None: + return ratelimits + else: + return ratelimits, conf_limits_info + + +def get_maxrate(ratelimits, size): + """ + Returns number of requests allowed per second for given size. 
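# Annotation (not part of the patch): interpret_conf_limits()/get_maxrate()
# interpolate linearly between the configured sizes. For example, with
#     container_ratelimit_100 = 100
#     container_ratelimit_200 = 50
# a container holding 150 objects is limited to roughly 75 write requests per
# second, containers below 100 objects are not limited at all, and containers
# at or above 200 objects are held to 50 requests per second.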
+ """ + last_func = None + if size: + size = int(size) + for ratesize, rate, func in ratelimits: + if size < ratesize: + break + last_func = func + if last_func: + return last_func(size) + return None + + class MaxSleepTimeHitError(Exception): pass @@ -35,11 +96,10 @@ class RateLimitMiddleware(object): BLACK_LIST_SLEEP = 1 def __init__(self, app, conf, logger=None): + self.app = app - if logger: - self.logger = logger - else: - self.logger = get_logger(conf, log_route='ratelimit') + self.logger = logger or get_logger(conf, log_route='ratelimit') + self.memcache_client = None self.account_ratelimit = float(conf.get('account_ratelimit', 0)) self.max_sleep_time_seconds = \ float(conf.get('max_sleep_time_seconds', 60)) @@ -50,94 +110,98 @@ def __init__(self, app, conf, logger=None): self.ratelimit_whitelist = \ [acc.strip() for acc in conf.get('account_whitelist', '').split(',') if acc.strip()] + if self.ratelimit_whitelist: + self.logger.warning('Option account_whitelist is deprecated. Use ' + 'an internal client to POST a `X-Account-' + 'Sysmeta-Global-Write-Ratelimit: WHITELIST` ' + 'header to the specific accounts instead.') self.ratelimit_blacklist = \ [acc.strip() for acc in conf.get('account_blacklist', '').split(',') if acc.strip()] - self.memcache_client = None - conf_limits = [] - for conf_key in conf.keys(): - if conf_key.startswith('container_ratelimit_'): - cont_size = int(conf_key[len('container_ratelimit_'):]) - rate = float(conf[conf_key]) - conf_limits.append((cont_size, rate)) - - conf_limits.sort() - self.container_ratelimits = [] - while conf_limits: - cur_size, cur_rate = conf_limits.pop(0) - if conf_limits: - next_size, next_rate = conf_limits[0] - slope = (float(next_rate) - float(cur_rate)) \ - / (next_size - cur_size) - - def new_scope(cur_size, slope, cur_rate): - # making new scope for variables - return lambda x: (x - cur_size) * slope + cur_rate - line_func = new_scope(cur_size, slope, cur_rate) - else: - line_func = lambda x: cur_rate - - self.container_ratelimits.append((cur_size, cur_rate, line_func)) + if self.ratelimit_blacklist: + self.logger.warning('Option account_blacklist is deprecated. Use ' + 'an internal client to POST a `X-Account-' + 'Sysmeta-Global-Write-Ratelimit: BLACKLIST` ' + 'header to the specific accounts instead.') + self.container_ratelimits = interpret_conf_limits( + conf, 'container_ratelimit_') + self.container_listing_ratelimits = interpret_conf_limits( + conf, 'container_listing_ratelimit_') - def get_container_maxrate(self, container_size): - """ - Returns number of requests allowed per second for given container size. - """ - last_func = None - if container_size: - container_size = int(container_size) - for size, rate, func in self.container_ratelimits: - if container_size < size: - break - last_func = func - if last_func: - return last_func(container_size) - return None + def get_container_size(self, env): + rv = 0 + container_info = get_container_info( + env, self.app, swift_source='RL') + if isinstance(container_info, dict): + rv = container_info.get( + 'object_count', container_info.get('container_size', 0)) + return rv - def get_ratelimitable_key_tuples(self, req_method, account_name, - container_name=None, obj_name=None): + def get_ratelimitable_key_tuples(self, req, account_name, + container_name=None, obj_name=None, + global_ratelimit=None): """ Returns a list of key (used in memcache), ratelimit tuples. Keys should be checked in order. 
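# Annotation (not part of the patch): the memcache keys built below look like
#     ratelimit/<account>                      (account-wide write limit)
#     ratelimit/<account>/<container>          (per-container write limit)
#     ratelimit_listing/<account>/<container>  (container listing GET limit)
#     ratelimit/global-write/<account>         (sysmeta-driven account limit)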
- :param req_method: HTTP method + :param req: swob request :param account_name: account name from path :param container_name: container name from path :param obj_name: object name from path + :param global_ratelimit: this account has an account wide + ratelimit on all writes combined """ keys = [] # COPYs are not limited + if self.account_ratelimit and \ account_name and container_name and not obj_name and \ - req_method in ('PUT', 'DELETE'): + req.method in ('PUT', 'DELETE'): keys.append(("ratelimit/%s" % account_name, self.account_ratelimit)) if account_name and container_name and obj_name and \ - req_method in ('PUT', 'DELETE', 'POST'): - container_size = None - memcache_key = get_container_memcache_key(account_name, - container_name) - container_info = self.memcache_client.get(memcache_key) - if isinstance(container_info, dict): - container_size = container_info.get( - 'count', container_info.get('container_size', 0)) - container_rate = self.get_container_maxrate(container_size) - if container_rate: - keys.append(("ratelimit/%s/%s" % (account_name, - container_name), - container_rate)) + req.method in ('PUT', 'DELETE', 'POST', 'COPY'): + container_size = self.get_container_size(req.environ) + container_rate = get_maxrate( + self.container_ratelimits, container_size) + if container_rate: + keys.append(( + "ratelimit/%s/%s" % (account_name, container_name), + container_rate)) + + if account_name and container_name and not obj_name and \ + req.method == 'GET': + container_size = self.get_container_size(req.environ) + container_rate = get_maxrate( + self.container_listing_ratelimits, container_size) + if container_rate: + keys.append(( + "ratelimit_listing/%s/%s" % (account_name, container_name), + container_rate)) + + if account_name and req.method in ('PUT', 'DELETE', 'POST', 'COPY'): + if global_ratelimit: + try: + global_ratelimit = float(global_ratelimit) + if global_ratelimit > 0: + keys.append(( + "ratelimit/global-write/%s" % account_name, + global_ratelimit)) + except ValueError: + pass + return keys def _get_sleep_time(self, key, max_rate): - ''' + """ Returns the amount of time (a float in seconds) that the app should sleep. :param key: a memcache key :param max_rate: maximum rate allowed in requests per second - :raises: MaxSleepTimeHitError if max sleep time is exceeded. - ''' + :raises MaxSleepTimeHitError: if max sleep time is exceeded. + """ try: now_m = int(round(time.time() * self.clock_accuracy)) time_per_request_m = int(round(self.clock_accuracy / max_rate)) @@ -166,43 +230,66 @@ def _get_sleep_time(self, key, max_rate): return 0 def handle_ratelimit(self, req, account_name, container_name, obj_name): - ''' + """ Performs rate limiting and account white/black listing. Sleeps - if necessary. + if necessary. If self.memcache_client is not set, immediately returns + None. 
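# Annotation (not part of the patch): the account-wide override consulted
# below lives in account sysmeta and is normally set with an internal client,
# e.g. a POST to the account carrying one of
#     X-Account-Sysmeta-Global-Write-Ratelimit: WHITELIST   (never limited)
#     X-Account-Sysmeta-Global-Write-Ratelimit: BLACKLIST   (always 497)
#     X-Account-Sysmeta-Global-Write-Ratelimit: 10.0        (cap combined
#                                                            writes to ~10/sec)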
:param account_name: account name from path :param container_name: container name from path :param obj_name: object name from path - ''' - if account_name in self.ratelimit_blacklist: - self.logger.error(_('Returning 497 because of blacklisting: %s'), + """ + if not self.memcache_client: + return None + + if req.environ.get('swift.ratelimit.handled'): + return None + req.environ['swift.ratelimit.handled'] = True + + try: + account_info = get_account_info(req.environ, self.app, + swift_source='RL') + account_global_ratelimit = \ + account_info.get('sysmeta', {}).get('global-write-ratelimit') + except ValueError: + account_global_ratelimit = None + + if account_name in self.ratelimit_whitelist or \ + account_global_ratelimit == 'WHITELIST': + return None + + if account_name in self.ratelimit_blacklist or \ + account_global_ratelimit == 'BLACKLIST': + self.logger.error('Returning 497 because of blacklisting: %s', account_name) eventlet.sleep(self.BLACK_LIST_SLEEP) return Response(status='497 Blacklisted', body='Your account has been blacklisted', request=req) - if account_name in self.ratelimit_whitelist: - return None + for key, max_rate in self.get_ratelimitable_key_tuples( - req.method, account_name, container_name=container_name, - obj_name=obj_name): + req, account_name, container_name=container_name, + obj_name=obj_name, global_ratelimit=account_global_ratelimit): try: need_to_sleep = self._get_sleep_time(key, max_rate) if self.log_sleep_time_seconds and \ need_to_sleep > self.log_sleep_time_seconds: self.logger.warning( - _("Ratelimit sleep log: %(sleep)s for " - "%(account)s/%(container)s/%(object)s"), + "Ratelimit sleep log: %(sleep)s for " + "%(account)s/%(container)s/%(object)s", {'sleep': need_to_sleep, 'account': account_name, 'container': container_name, 'object': obj_name}) if need_to_sleep > 0: eventlet.sleep(need_to_sleep) - except MaxSleepTimeHitError, e: + except MaxSleepTimeHitError as e: + if obj_name: + path = '/'.join((account_name, container_name, obj_name)) + else: + path = '/'.join((account_name, container_name)) self.logger.error( - _('Returning 498 for %(meth)s to %(acc)s/%(cont)s/%(obj)s ' - '. Ratelimit (Max Sleep) %(e)s'), - {'meth': req.method, 'acc': account_name, - 'cont': container_name, 'obj': obj_name, 'e': str(e)}) + 'Returning 498 for %(meth)s to %(path)s. 
' + 'Ratelimit (Max Sleep) %(e)s', + {'meth': req.method, 'path': path, 'e': str(e)}) error_resp = Response(status='498 Rate Limited', body='Slow down', request=req) return error_resp @@ -221,12 +308,14 @@ def __call__(self, env, start_response): self.memcache_client = cache_from_env(env) if not self.memcache_client: self.logger.warning( - _('Warning: Cannot ratelimit without a memcached client')) + 'Cannot ratelimit without a memcached client') return self.app(env, start_response) try: - version, account, container, obj = split_path(req.path, 1, 4, True) + version, account, container, obj = req.split_path(1, 4, True) except ValueError: return self.app(env, start_response) + if not valid_api_version(version): + return self.app(env, start_response) ratelimit_resp = self.handle_ratelimit(req, account, container, obj) if ratelimit_resp is None: return self.app(env, start_response) @@ -241,6 +330,20 @@ def filter_factory(global_conf, **local_conf): conf = global_conf.copy() conf.update(local_conf) + account_ratelimit = float(conf.get('account_ratelimit', 0)) + max_sleep_time_seconds = float(conf.get('max_sleep_time_seconds', 60)) + container_ratelimits, cont_limit_info = interpret_conf_limits( + conf, 'container_ratelimit_', info=1) + container_listing_ratelimits, cont_list_limit_info = \ + interpret_conf_limits(conf, 'container_listing_ratelimit_', info=1) + # not all limits are exposed (intentionally) + register_swift_info('ratelimit', + account_ratelimit=account_ratelimit, + max_sleep_time_seconds=max_sleep_time_seconds, + container_ratelimits=cont_limit_info, + container_listing_ratelimits=cont_list_limit_info) + def limit_filter(app): return RateLimitMiddleware(app, conf) + return limit_filter diff --git a/swift/common/middleware/read_only.py b/swift/common/middleware/read_only.py new file mode 100644 index 0000000000..b905ff1c97 --- /dev/null +++ b/swift/common/middleware/read_only.py @@ -0,0 +1,125 @@ +# Copyright (c) 2010-2015 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. +from swift.common.constraints import check_account_format, valid_api_version +from swift.common.swob import HTTPMethodNotAllowed, Request +from swift.common.utils import get_logger, config_true_value +from swift.common.registry import register_swift_info +from swift.proxy.controllers.base import get_info + +""" +========= +Read Only +========= + +The ability to make an entire cluster or individual accounts read only is +implemented as pluggable middleware. When a cluster or an account is in read +only mode, requests that would result in writes to the cluser are not allowed. +A 405 is returned on such requests. "COPY", "DELETE", "POST", and +"PUT" are the HTTP methods that are considered writes. + +------------- +Configuration +------------- + +All configuration is optional. 
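Annotation, not part of the patch: a minimal proxy-server.conf sketch for the
options in the table below, assuming the middleware is registered under the
usual ``egg:swift#read_only`` entry point (pipeline abbreviated)::

    [pipeline:main]
    pipeline = catch_errors proxy-logging cache read_only proxy-server

    [filter:read_only]
    use = egg:swift#read_only
    read_only = true
    allow_deletes = false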
+ +============= ======= ==================================================== +Option Default Description +------------- ------- ---------------------------------------------------- +read_only false Set to 'true' to put the entire cluster in read only + mode. +allow_deletes false Set to 'true' to allow deletes. +============= ======= ==================================================== + +--------------------------- +Marking Individual Accounts +--------------------------- + +If a system administrator wants to mark individual accounts as read only, +he/she can set X-Account-Sysmeta-Read-Only on an account to 'true'. + +If a system administrator wants to allow writes to individual accounts, +when a cluster is in read only mode, he/she can set +X-Account-Sysmeta-Read-Only on an account to 'false'. + +This header will be hidden from the user, because of the gatekeeper middleware, +and can only be set using a direct client to the account nodes. +""" + + +class ReadOnlyMiddleware(object): + """ + Middleware that make an entire cluster or individual accounts read only. + """ + + def __init__(self, app, conf, logger=None): + self.app = app + self.logger = logger or get_logger(conf, log_route='read_only') + self.read_only = config_true_value(conf.get('read_only')) + self.write_methods = {'COPY', 'POST', 'PUT'} + if not config_true_value(conf.get('allow_deletes')): + self.write_methods.add('DELETE') + + def __call__(self, env, start_response): + req = Request(env) + + if req.method not in self.write_methods: + return self.app(env, start_response) + + try: + version, account, container, obj = req.split_path(2, 4, True) + if not valid_api_version(version): + raise ValueError + except ValueError: + return self.app(env, start_response) + + if req.method == 'COPY' and 'Destination-Account' in req.headers: + dest_account = req.headers.get('Destination-Account') + account = check_account_format(req, dest_account) + + if self.account_read_only(req, account): + msg = 'Writes are disabled for this account.' + return HTTPMethodNotAllowed(body=msg)(env, start_response) + + return self.app(env, start_response) + + def account_read_only(self, req, account): + """ + Check whether an account should be read-only. + + This considers both the cluster-wide config value as well as the + per-account override in X-Account-Sysmeta-Read-Only. + """ + info = get_info(self.app, req.environ, account, swift_source='RO') + read_only = info.get('sysmeta', {}).get('read-only', '') + if not read_only: + return self.read_only + return config_true_value(read_only) + + +def filter_factory(global_conf, **local_conf): + """ + paste.deploy app factory for creating WSGI proxy apps. + """ + conf = global_conf.copy() + conf.update(local_conf) + + if config_true_value(conf.get('read_only')): + register_swift_info('read_only') + + def read_only_filter(app): + return ReadOnlyMiddleware(app, conf) + + return read_only_filter diff --git a/swift/common/middleware/recon.py b/swift/common/middleware/recon.py index 4bcb8f6db6..0a6d35d07c 100644 --- a/swift/common/middleware/recon.py +++ b/swift/common/middleware/recon.py @@ -1,4 +1,4 @@ -# Copyright (c) 2010-2012 OpenStack, LLC. +# Copyright (c) 2010-2012 OpenStack Foundation # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. @@ -14,17 +14,19 @@ # limitations under the License. 
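# Annotation (not part of the patch; the sample cache contents are made up):
# the recon data served by this middleware comes from small JSON cache files
# that the background daemons drop under recon_cache_path (/var/cache/swift
# by default). For instance, if object.recon contains {"async_pending": 3},
# then
#     self._from_recon_cache(['async_pending', 'async_pending_last'],
#                            self.object_recon_cache)
# as used by get_async_info() below returns
#     {'async_pending': 3, 'async_pending_last': None}
# -- keys missing from the cache file simply come back as None.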
import errno +import json import os +import time +from resource import getpagesize -from swift.common.swob import Request, Response -from swift.common.utils import split_path, get_logger, config_true_value +from swift import __version__ as swiftver from swift.common.constraints import check_mount -from resource import getpagesize -from hashlib import md5 -try: - import simplejson as json -except ImportError: - import json +from swift.common.storage_policy import POLICIES +from swift.common.swob import Request, Response +from swift.common.utils import get_logger, SWIFT_CONF_FILE, md5_hash_for_file +from swift.common.recon import RECON_OBJECT_FILE, RECON_CONTAINER_FILE, \ + RECON_ACCOUNT_FILE, RECON_DRIVE_FILE, RECON_RELINKER_FILE, \ + DEFAULT_RECON_CACHE_PATH class ReconMiddleware(object): @@ -33,8 +35,8 @@ class ReconMiddleware(object): /recon/load|mem|async... will return various system metrics. - Needs to be added to the pipeline and a requires a filter - declaration in the object-server.conf: + Needs to be added to the pipeline and requires a filter + declaration in the [account|container|object]-server conf file: [filter:recon] use = egg:swift#recon @@ -43,44 +45,61 @@ class ReconMiddleware(object): def __init__(self, app, conf, *args, **kwargs): self.app = app - self.devices = conf.get('devices', '/srv/node/') + self.devices = conf.get('devices', '/srv/node') swift_dir = conf.get('swift_dir', '/etc/swift') self.logger = get_logger(conf, log_route='recon') self.recon_cache_path = conf.get('recon_cache_path', - '/var/cache/swift') + DEFAULT_RECON_CACHE_PATH) self.object_recon_cache = os.path.join(self.recon_cache_path, - 'object.recon') + RECON_OBJECT_FILE) self.container_recon_cache = os.path.join(self.recon_cache_path, - 'container.recon') + RECON_CONTAINER_FILE) self.account_recon_cache = os.path.join(self.recon_cache_path, - 'account.recon') + RECON_ACCOUNT_FILE) + self.drive_recon_cache = os.path.join(self.recon_cache_path, + RECON_DRIVE_FILE) + self.relink_recon_cache = os.path.join(self.recon_cache_path, + RECON_RELINKER_FILE) self.account_ring_path = os.path.join(swift_dir, 'account.ring.gz') self.container_ring_path = os.path.join(swift_dir, 'container.ring.gz') - self.object_ring_path = os.path.join(swift_dir, 'object.ring.gz') - self.rings = [self.account_ring_path, self.container_ring_path, - self.object_ring_path] - self.mount_check = config_true_value(conf.get('mount_check', 'true')) - def _from_recon_cache(self, cache_keys, cache_file, openr=open): + self.rings = [self.account_ring_path, self.container_ring_path] + # include all object ring files (for all policies) + for policy in POLICIES: + self.rings.append(os.path.join(swift_dir, + policy.ring_name + '.ring.gz')) + + def _from_recon_cache(self, cache_keys, cache_file, openr=open, + ignore_missing=False): """retrieve values from a recon cache file :params cache_keys: list of cache items to retrieve :params cache_file: cache file to retrieve items from. :params openr: open to use [for unittests] - :return: dict of cache items and their value or none if not found + :params ignore_missing: Some recon stats are very temporary, in this + case it would be better to not log if things are missing. 
+ :return: dict of cache items and their values or none if not found """ try: with openr(cache_file, 'r') as f: recondata = json.load(f) - return dict((key, recondata.get(key)) for key in cache_keys) - except IOError: - self.logger.exception(_('Error reading recon cache file')) + return {key: recondata.get(key) for key in cache_keys} + except IOError as err: + if err.errno == errno.ENOENT and ignore_missing: + pass + else: + self.logger.exception('Error reading recon cache file') except ValueError: - self.logger.exception(_('Error parsing recon cache file')) + self.logger.exception('Error parsing recon cache file') except Exception: - self.logger.exception(_('Error retrieving recon data')) + self.logger.exception('Error retrieving recon data') return dict((key, None) for key in cache_keys) + def get_version(self): + """get swift version""" + verinfo = {'version': swiftver} + return verinfo + def get_mounted(self, openr=open): """get ALL mounted fs from /proc/mounts""" mounts = [] @@ -115,31 +134,53 @@ def get_mem(self, openr=open): def get_async_info(self): """get # of async pendings""" - return self._from_recon_cache(['async_pending'], + return self._from_recon_cache(['async_pending', 'async_pending_last'], self.object_recon_cache) + def get_driveaudit_error(self): + """get # of drive audit errors""" + return self._from_recon_cache(['drive_audit_errors'], + self.drive_recon_cache) + + def get_sharding_info(self): + """get sharding info""" + return self._from_recon_cache(["sharding_stats", + "sharding_time", + "sharding_last"], + self.container_recon_cache) + def get_replication_info(self, recon_type): """get replication info""" + replication_list = ['replication_time', + 'replication_stats', + 'replication_last'] if recon_type == 'account': - return self._from_recon_cache(['replication_time', - 'replication_stats'], + return self._from_recon_cache(replication_list, self.account_recon_cache) elif recon_type == 'container': - return self._from_recon_cache(['replication_time', - 'replication_stats'], + return self._from_recon_cache(replication_list, self.container_recon_cache) elif recon_type == 'object': - return self._from_recon_cache(['object_replication_time'], + replication_list += ['object_replication_time', + 'object_replication_last'] + return self._from_recon_cache(replication_list, self.object_recon_cache) else: return None + def get_reconstruction_info(self): + """get reconstruction info""" + reconstruction_list = ['object_reconstruction_last', + 'object_reconstruction_time'] + return self._from_recon_cache(reconstruction_list, + self.object_recon_cache) + def get_device_info(self): """get devices""" try: return {self.devices: os.listdir(self.devices)} except Exception: - self.logger.exception(_('Error listing devices')) + self.logger.exception('Error listing devices') return {self.devices: None} def get_updater_info(self, recon_type): @@ -148,7 +189,9 @@ def get_updater_info(self, recon_type): return self._from_recon_cache(['container_updater_sweep'], self.container_recon_cache) elif recon_type == 'object': - return self._from_recon_cache(['object_updater_sweep'], + return self._from_recon_cache(['object_updater_sweep', + 'object_updater_stats', + 'object_updater_last'], self.object_recon_cache) else: return None @@ -185,17 +228,36 @@ def get_unmounted(self): """list unmounted (failed?) 
devices""" mountlist = [] for entry in os.listdir(self.devices): - mpoint = {'device': entry, - 'mounted': check_mount(self.devices, entry)} - if not mpoint['mounted']: - mountlist.append(mpoint) + if not os.path.isdir(os.path.join(self.devices, entry)): + continue + + try: + check_mount(self.devices, entry) + except OSError as err: + mounted = str(err) + except ValueError: + mounted = False + else: + continue + mountlist.append({'device': entry, 'mounted': mounted}) return mountlist def get_diskusage(self): """get disk utilization statistics""" devices = [] for entry in os.listdir(self.devices): - if check_mount(self.devices, entry): + if not os.path.isdir(os.path.join(self.devices, entry)): + continue + + try: + check_mount(self.devices, entry) + except OSError as err: + devices.append({'device': entry, 'mounted': str(err), + 'size': '', 'used': '', 'avail': ''}) + except ValueError: + devices.append({'device': entry, 'mounted': False, + 'size': '', 'used': '', 'avail': ''}) + else: path = os.path.join(self.devices, entry) disk = os.statvfs(path) capacity = disk.f_bsize * disk.f_blocks @@ -204,41 +266,55 @@ def get_diskusage(self): devices.append({'device': entry, 'mounted': True, 'size': capacity, 'used': used, 'avail': available}) - else: - devices.append({'device': entry, 'mounted': False, - 'size': '', 'used': '', 'avail': ''}) return devices - def get_ring_md5(self, openr=open): + def get_ring_md5(self): """get all ring md5sum's""" sums = {} for ringfile in self.rings: - md5sum = md5() if os.path.exists(ringfile): try: - with openr(ringfile, 'rb') as f: - block = f.read(4096) - while block: - md5sum.update(block) - block = f.read(4096) - sums[ringfile] = md5sum.hexdigest() - except IOError, err: + sums[ringfile] = md5_hash_for_file(ringfile) + except IOError as err: sums[ringfile] = None if err.errno != errno.ENOENT: - self.logger.exception(_('Error reading ringfile')) + self.logger.exception('Error reading ringfile') return sums + def get_swift_conf_md5(self): + """get md5 of swift.conf""" + hexsum = None + try: + hexsum = md5_hash_for_file(SWIFT_CONF_FILE) + except IOError as err: + if err.errno != errno.ENOENT: + self.logger.exception('Error reading swift.conf') + return {SWIFT_CONF_FILE: hexsum} + def get_quarantine_count(self): """get obj/container/account quarantine counts""" - qcounts = {"objects": 0, "containers": 0, "accounts": 0} + qcounts = {"objects": 0, "containers": 0, "accounts": 0, + "policies": {}} qdir = "quarantined" for device in os.listdir(self.devices): - for qtype in qcounts: - qtgt = os.path.join(self.devices, device, qdir, qtype) - if os.path.exists(qtgt): + qpath = os.path.join(self.devices, device, qdir) + if os.path.exists(qpath): + for qtype in os.listdir(qpath): + qtgt = os.path.join(qpath, qtype) linkcount = os.lstat(qtgt).st_nlink if linkcount > 2: - qcounts[qtype] += linkcount - 2 + if qtype.startswith('objects'): + if '-' in qtype: + pkey = qtype.split('-', 1)[1] + else: + pkey = '0' + qcounts['policies'].setdefault(pkey, + {'objects': 0}) + qcounts['policies'][pkey]['objects'] \ + += linkcount - 2 + qcounts['objects'] += linkcount - 2 + else: + qcounts[qtype] += linkcount - 2 return qcounts def get_socket_info(self, openr=open): @@ -272,8 +348,21 @@ def get_socket_info(self, openr=open): raise return sockstat + def get_time(self): + """get current time""" + + return time.time() + + def get_relinker_info(self): + """get relinker info, if any""" + + stat_keys = ['devices', 'workers'] + return self._from_recon_cache(stat_keys, + 
self.relink_recon_cache, + ignore_missing=True) + def GET(self, req): - root, rcheck, rtype = split_path(req.path, 1, 3, True) + root, rcheck, rtype = req.split_path(1, 3, True) all_rtypes = ['account', 'container', 'object'] if rcheck == "mem": content = self.get_mem() @@ -284,7 +373,7 @@ def GET(self, req): elif rcheck == 'replication' and rtype in all_rtypes: content = self.get_replication_info(rtype) elif rcheck == 'replication' and rtype is None: - #handle old style object replication requests + # handle old style object replication requests content = self.get_replication_info('object') elif rcheck == "devices": content = self.get_device_info() @@ -302,10 +391,24 @@ def GET(self, req): content = self.get_diskusage() elif rcheck == "ringmd5": content = self.get_ring_md5() + elif rcheck == "swiftconfmd5": + content = self.get_swift_conf_md5() elif rcheck == "quarantined": content = self.get_quarantine_count() elif rcheck == "sockstat": content = self.get_socket_info() + elif rcheck == "version": + content = self.get_version() + elif rcheck == "driveaudit": + content = self.get_driveaudit_error() + elif rcheck == "time": + content = self.get_time() + elif rcheck == "sharding": + content = self.get_sharding_info() + elif rcheck == "relinker": + content = self.get_relinker_info() + elif rcheck == "reconstruction" and rtype == 'object': + content = self.get_reconstruction_info() else: content = "Invalid path: %s" % req.path return Response(request=req, status="404 Not Found", diff --git a/swift/common/middleware/s3api/__init__.py b/swift/common/middleware/s3api/__init__.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/swift/common/middleware/s3api/acl_handlers.py b/swift/common/middleware/s3api/acl_handlers.py new file mode 100644 index 0000000000..f5b8c587b9 --- /dev/null +++ b/swift/common/middleware/s3api/acl_handlers.py @@ -0,0 +1,485 @@ +# Copyright (c) 2014 OpenStack Foundation. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. +""" +------------ +Acl Handlers +------------ + +Why do we need this +^^^^^^^^^^^^^^^^^^^ + +To make controller classes clean, we need these handlers. +It is really useful for customizing acl checking algorithms for +each controller. + +Basic Information +^^^^^^^^^^^^^^^^^ + +BaseAclHandler wraps basic Acl handling. +(i.e. it will check acl from ACL_MAP by using HEAD) + +How to extend +^^^^^^^^^^^^^ + +Make a handler with the name of the controller. +(e.g. BucketAclHandler is for BucketController) +It consists of method(s) for actual S3 method on controllers as follows. + +Example:: + + class BucketAclHandler(BaseAclHandler): + def PUT: + << put acl handling algorithms here for PUT bucket >> + +.. note:: + If the method DON'T need to recall _get_response in outside of + acl checking, the method have to return the response it needs at + the end of method. 
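As a concrete counterpart to the pseudocode example above, a handler for a hypothetical controller could look like the sketch below. The class name and the permission choice are illustrative assumptions; only BaseAclHandler and _handle_acl come from this module.

# hypothetical handler, not part of the patch
class WidgetAclHandler(BaseAclHandler):
    def PUT(self, app):
        # check WRITE on the bucket (via a HEAD with an empty object name)
        # before the backend PUT goes out; falling through (returning None)
        # lets the caller continue with the real request
        self._handle_acl(app, 'HEAD', obj='', permission='WRITE')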
+ +""" +from swift.common.middleware.s3api.subresource import ACL, Owner, encode_acl +from swift.common.middleware.s3api.s3response import MissingSecurityHeader, \ + MalformedACLError, UnexpectedContent, AccessDenied +from swift.common.middleware.s3api.etree import fromstring, XMLSyntaxError, \ + DocumentInvalid +from swift.common.middleware.s3api.utils import MULTIUPLOAD_SUFFIX, \ + sysmeta_header + + +def get_acl_handler(controller_name): + for base_klass in [BaseAclHandler, MultiUploadAclHandler]: + # pylint: disable-msg=E1101 + for handler in base_klass.__subclasses__(): + handler_suffix_len = len('AclHandler') \ + if not handler.__name__ == 'S3AclHandler' else len('Handler') + if handler.__name__[:-handler_suffix_len] == controller_name: + return handler + return BaseAclHandler + + +class BaseAclHandler(object): + """ + BaseAclHandler: Handling ACL for basic requests mapped on ACL_MAP + """ + def __init__(self, req, logger, container=None, obj=None, headers=None): + self.req = req + self.container = req.container_name if container is None else container + self.obj = req.object_name if obj is None else obj + self.method = req.environ['REQUEST_METHOD'] + self.user_id = self.req.user_id + self.headers = req.headers if headers is None else headers + self.logger = logger + + def request_with(self, container, obj, headers): + return type(self)(self.req, self.logger, + container=container, obj=obj, headers=headers) + + def handle_acl(self, app, method, container=None, obj=None, headers=None): + method = method or self.method + + ah = self.request_with(container, obj, headers) + if hasattr(ah, method): + return getattr(ah, method)(app) + else: + return ah._handle_acl(app, method) + + def _handle_acl(self, app, sw_method, container=None, obj=None, + permission=None, headers=None): + """ + General acl handling method. + This method expects to call Request._get_response() in outside of + this method so that this method returns response only when sw_method + is HEAD. + """ + + container = self.container if container is None else container + obj = self.obj if obj is None else obj + sw_method = sw_method or self.req.environ['REQUEST_METHOD'] + resource = 'object' if obj else 'container' + headers = self.headers if headers is None else headers + + self.logger.debug( + 'checking permission: %s %s %s %s' % + (container, obj, sw_method, dict(headers))) + + if not container: + return + + if not permission and (self.method, sw_method, resource) in ACL_MAP: + acl_check = ACL_MAP[(self.method, sw_method, resource)] + resource = acl_check.get('Resource') or resource + permission = acl_check['Permission'] + + if not permission: + self.logger.debug( + '%s %s %s %s' % (container, obj, sw_method, headers)) + raise Exception('No permission to be checked exists') + + if resource == 'object': + version_id = self.req.params.get('versionId') + if version_id is None: + query = {} + else: + query = {'version-id': version_id} + if self.req.method == 'HEAD': + # This HEAD for ACL is going to also be the definitive response + # to the client so we need to include client params. We don't + # do this for other client request methods because they may + # have invalid combinations of params and headers for a swift + # HEAD request. 
+ part_number = self.req.params.get('partNumber') + if part_number is not None: + query['part-number'] = part_number + resp = self.req.get_acl_response(app, 'HEAD', + container, obj, + headers, query=query) + acl = resp.object_acl + elif resource == 'container': + resp = self.req.get_acl_response(app, 'HEAD', + container, '') + acl = resp.bucket_acl + + try: + acl.check_permission(self.user_id, permission) + except Exception as e: + self.logger.debug(acl) + self.logger.debug('permission denined: %s %s %s' % + (e, self.user_id, permission)) + raise + + if sw_method == 'HEAD': + return resp + + def get_acl(self, headers, body, bucket_owner, object_owner=None): + """ + Get ACL instance from S3 (e.g. x-amz-grant) headers or S3 acl xml body. + """ + acl = ACL.from_headers(headers, bucket_owner, object_owner, + as_private=False) + + if acl is None: + # Get acl from request body if possible. + if not body: + raise MissingSecurityHeader(missing_header_name='x-amz-acl') + try: + elem = fromstring(body, ACL.root_tag) + acl = ACL.from_elem( + elem, True, self.req.conf.allow_no_owner) + except (XMLSyntaxError, DocumentInvalid): + raise MalformedACLError() + except Exception as e: + self.logger.error(e) + raise + else: + if body: + # Specifying grant with both header and xml is not allowed. + raise UnexpectedContent() + + return acl + + +class BucketAclHandler(BaseAclHandler): + """ + BucketAclHandler: Handler for BucketController + """ + def DELETE(self, app): + if self.container.endswith(MULTIUPLOAD_SUFFIX): + # anyways, delete multiupload container doesn't need acls + # because it depends on GET segment container result for + # cleanup + pass + else: + return self._handle_acl(app, 'DELETE') + + def HEAD(self, app): + if self.method == 'DELETE': + return self._handle_acl(app, 'DELETE') + else: + return self._handle_acl(app, 'HEAD') + + def GET(self, app): + if self.method == 'DELETE' and \ + self.container.endswith(MULTIUPLOAD_SUFFIX): + pass + else: + return self._handle_acl(app, 'GET') + + def PUT(self, app): + req_acl = ACL.from_headers(self.req.headers, + Owner(self.user_id, self.user_id)) + + if not self.req.environ.get('swift_owner'): + raise AccessDenied() + + # To avoid overwriting the existing bucket's ACL, we send PUT + # request first before setting the ACL to make sure that the target + # container does not exist. + self.req.get_acl_response(app, 'PUT', self.container) + + # update metadata + self.req.bucket_acl = req_acl + + # FIXME If this request is failed, there is a possibility that the + # bucket which has no ACL is left. 
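        # Clarifying note (not part of the original patch): bucket creation
        # (the PUT above) and ACL application (the POST below) are two
        # separate backend requests, which is why the window described in
        # the FIXME exists.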
+ return self.req.get_acl_response(app, 'POST') + + +class ObjectAclHandler(BaseAclHandler): + """ + ObjectAclHandler: Handler for ObjectController + """ + def HEAD(self, app): + # No check object permission needed at DELETE Object + if self.method != 'DELETE': + return self._handle_acl(app, 'HEAD') + + def PUT(self, app): + b_resp = self._handle_acl(app, 'HEAD', obj='') + req_acl = ACL.from_headers(self.req.headers, + b_resp.bucket_acl.owner, + Owner(self.user_id, self.user_id)) + self.req.object_acl = req_acl + + +class S3AclHandler(BaseAclHandler): + """ + S3AclHandler: Handler for S3AclController + """ + def HEAD(self, app): + self._handle_acl(app, 'HEAD', permission='READ_ACP') + + def GET(self, app): + self._handle_acl(app, 'HEAD', permission='READ_ACP') + + def PUT(self, app): + if self.req.is_object_request: + b_resp = self.req.get_acl_response(app, 'HEAD', obj='') + o_resp = self._handle_acl(app, 'HEAD', permission='WRITE_ACP') + req_acl = self.get_acl(self.req.headers, + self.req.xml(ACL.max_xml_length), + b_resp.bucket_acl.owner, + o_resp.object_acl.owner) + + # Don't change the owner of the resource by PUT acl request. + o_resp.object_acl.check_owner(req_acl.owner.id) + + for g in req_acl.grants: + self.logger.debug( + 'Grant %s %s permission on the object /%s/%s' % + (g.grantee, g.permission, self.req.container_name, + self.req.object_name)) + self.req.object_acl = req_acl + else: + self._handle_acl(app, self.method) + + def POST(self, app): + if self.req.is_bucket_request: + resp = self._handle_acl(app, 'HEAD', permission='WRITE_ACP') + + req_acl = self.get_acl(self.req.headers, + self.req.xml(ACL.max_xml_length), + resp.bucket_acl.owner) + + # Don't change the owner of the resource by PUT acl request. + resp.bucket_acl.check_owner(req_acl.owner.id) + + for g in req_acl.grants: + self.logger.debug( + 'Grant %s %s permission on the bucket /%s' % + (g.grantee, g.permission, self.req.container_name)) + self.req.bucket_acl = req_acl + else: + self._handle_acl(app, self.method) + + +class MultiObjectDeleteAclHandler(BaseAclHandler): + """ + MultiObjectDeleteAclHandler: Handler for MultiObjectDeleteController + """ + def HEAD(self, app): + # Only bucket write acl is required + if not self.obj: + return self._handle_acl(app, 'HEAD') + + def DELETE(self, app): + # Only bucket write acl is required + pass + + +class MultiUploadAclHandler(BaseAclHandler): + """ + MultiUpload stuff requires acl checking just once for BASE container + so that MultiUploadAclHandler extends BaseAclHandler to check acl only + when the verb defined. We should define the verb as the first step to + request to backend Swift at incoming request. + + Basic Rules: + - BASE container name is always w/o 'MULTIUPLOAD_SUFFIX' + - Any check timing is ok but we should check it as soon as possible. + + ========== ====== ============= ========== + Controller Verb CheckResource Permission + ========== ====== ============= ========== + Part PUT Container WRITE + Uploads GET Container READ + Uploads POST Container WRITE + Upload GET Container READ + Upload DELETE Container WRITE + Upload POST Container WRITE + ========== ====== ============= ========== + + """ + def __init__(self, req, logger, **kwargs): + super(MultiUploadAclHandler, self).__init__(req, logger, **kwargs) + self.acl_checked = False + + def handle_acl(self, app, method, container=None, obj=None, headers=None): + method = method or self.method + ah = self.request_with(container, obj, headers) + # MultiUpload stuffs don't need acl check basically. 
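        # Clarifying note (not part of the original patch): unlike
        # BaseAclHandler.handle_acl there is no _handle_acl fallback below,
        # so Swift methods without an explicit handler method are passed
        # through without an ACL check.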
+ if hasattr(ah, method): + return getattr(ah, method)(app) + + def HEAD(self, app): + # For _check_upload_info + self._handle_acl(app, 'HEAD', self.container, '') + + +class PartAclHandler(MultiUploadAclHandler): + """ + PartAclHandler: Handler for PartController + """ + def __init__(self, req, logger, **kwargs): + # pylint: disable-msg=E1003 + super(MultiUploadAclHandler, self).__init__(req, logger, **kwargs) + + def HEAD(self, app): + if self.container.endswith(MULTIUPLOAD_SUFFIX): + # For _check_upload_info + container = self.container[:-len(MULTIUPLOAD_SUFFIX)] + self._handle_acl(app, 'HEAD', container, '') + else: + # For check_copy_source + return self._handle_acl(app, 'HEAD', self.container, self.obj) + + +class UploadsAclHandler(MultiUploadAclHandler): + """ + UploadsAclHandler: Handler for UploadsController + """ + def handle_acl(self, app, method, *args, **kwargs): + method = method or self.method + if hasattr(self, method): + return getattr(self, method)(app) + else: + pass + + def GET(self, app): + # List Multipart Upload + self._handle_acl(app, 'GET', self.container, '') + + def PUT(self, app): + if not self.acl_checked: + resp = self._handle_acl(app, 'HEAD', obj='') + req_acl = ACL.from_headers(self.req.headers, + resp.bucket_acl.owner, + Owner(self.user_id, self.user_id)) + acl_headers = encode_acl('object', req_acl) + self.req.headers[sysmeta_header('object', 'tmpacl')] = \ + acl_headers[sysmeta_header('object', 'acl')] + self.acl_checked = True + + +class UploadAclHandler(MultiUploadAclHandler): + """ + UploadAclHandler: Handler for UploadController + """ + def handle_acl(self, app, method, *args, **kwargs): + method = method or self.method + if hasattr(self, method): + return getattr(self, method)(app) + else: + pass + + def HEAD(self, app): + # FIXME: GET HEAD case conflicts with GET service + method = 'GET' if self.method == 'GET' else 'HEAD' + self._handle_acl(app, method, self.container, '') + + def PUT(self, app): + container = self.req.container_name + MULTIUPLOAD_SUFFIX + obj = '%s/%s' % (self.obj, self.req.params['uploadId']) + resp = self.req._get_response(app, 'HEAD', container, obj) + self.req.headers[sysmeta_header('object', 'acl')] = \ + resp.sysmeta_headers.get(sysmeta_header('object', 'tmpacl')) + + +""" +ACL_MAP = + { + ('', '', ''): + {'Resource': '', + 'Permission': ''}, + ... 
+ } + +s3_method: Method of S3 Request from user to s3api +swift_method: Method of Swift Request from s3api to swift +swift_resource: Resource of Swift Request from s3api to swift +check_resource: +check_permission: +""" +ACL_MAP = { + # HEAD Bucket + ('HEAD', 'HEAD', 'container'): + {'Permission': 'READ'}, + # GET Service + ('GET', 'HEAD', 'container'): + {'Permission': 'OWNER'}, + # GET Bucket, List Parts, List Multipart Upload + ('GET', 'GET', 'container'): + {'Permission': 'READ'}, + # PUT Object, PUT Object Copy + ('PUT', 'HEAD', 'container'): + {'Permission': 'WRITE'}, + # DELETE Bucket + ('DELETE', 'DELETE', 'container'): + {'Permission': 'OWNER'}, + # HEAD Object + ('HEAD', 'HEAD', 'object'): + {'Permission': 'READ'}, + # GET Object + ('GET', 'GET', 'object'): + {'Permission': 'READ'}, + # PUT Object Copy, Upload Part Copy + ('PUT', 'HEAD', 'object'): + {'Permission': 'READ'}, + # Abort Multipart Upload + ('DELETE', 'HEAD', 'container'): + {'Permission': 'WRITE'}, + # Delete Object + ('DELETE', 'DELETE', 'object'): + {'Resource': 'container', + 'Permission': 'WRITE'}, + # Complete Multipart Upload, DELETE Multiple Objects, + # Initiate Multipart Upload + ('POST', 'HEAD', 'container'): + {'Permission': 'WRITE'}, + # Versioning + ('PUT', 'POST', 'container'): + {'Permission': 'WRITE'}, + ('DELETE', 'GET', 'container'): + {'Permission': 'WRITE'}, +} diff --git a/swift/common/middleware/s3api/acl_utils.py b/swift/common/middleware/s3api/acl_utils.py new file mode 100644 index 0000000000..b2821a3d2b --- /dev/null +++ b/swift/common/middleware/s3api/acl_utils.py @@ -0,0 +1,100 @@ +# Copyright (c) 2014 OpenStack Foundation. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +from swift.common.middleware.s3api.exception import ACLError +from swift.common.middleware.s3api.etree import fromstring, XMLSyntaxError, \ + DocumentInvalid, XMLNS_XSI +from swift.common.middleware.s3api.s3response import S3NotImplemented, \ + MalformedACLError, InvalidArgument + + +def swift_acl_translate(acl, group='', user='', xml=False): + """ + Takes an S3 style ACL and returns a list of header/value pairs that + implement that ACL in Swift, or "NotImplemented" if there isn't a way to do + that yet. 
+ """ + swift_acl = {} + swift_acl['public-read'] = [['X-Container-Read', '.r:*,.rlistings']] + # Swift does not support public write: + # https://answers.launchpad.net/swift/+question/169541 + swift_acl['public-read-write'] = [['X-Container-Write', '.r:*'], + ['X-Container-Read', + '.r:*,.rlistings']] + + # TODO: if there's a way to get group and user, this should work for + # private: + # swift_acl['private'] = \ + # [['HTTP_X_CONTAINER_WRITE', group + ':' + user], \ + # ['HTTP_X_CONTAINER_READ', group + ':' + user]] + swift_acl['private'] = [['X-Container-Write', '.'], + ['X-Container-Read', '.']] + + # Swift doesn't have per-object ACLs, so this is best-effort + swift_acl['bucket-owner-full-control'] = swift_acl['private'] + swift_acl['bucket-owner-read'] = swift_acl['private'] + + if xml: + # We are working with XML and need to parse it + try: + elem = fromstring(acl, 'AccessControlPolicy') + except (XMLSyntaxError, DocumentInvalid): + raise MalformedACLError() + acl = 'unknown' + for grant in elem.findall('./AccessControlList/Grant'): + permission = grant.find('./Permission').text + grantee = grant.find('./Grantee').get('{%s}type' % XMLNS_XSI) + if permission == "FULL_CONTROL" and grantee == 'CanonicalUser' and\ + acl != 'public-read' and acl != 'public-read-write': + acl = 'private' + elif permission == "READ" and grantee == 'Group' and\ + acl != 'public-read-write': + acl = 'public-read' + elif permission == "WRITE" and grantee == 'Group': + acl = 'public-read-write' + else: + acl = 'unsupported' + + if acl in ('authenticated-read', 'log-delivery-write'): + raise S3NotImplemented() + elif acl not in swift_acl: + raise ACLError() + + return swift_acl[acl] + + +def handle_acl_header(req): + """ + Handle the x-amz-acl header. + Note that this header currently used for only normal-acl + (not implemented) on s3acl. + TODO: add translation to swift acl like as x-container-read to s3acl + """ + + amz_acl = req.environ['HTTP_X_AMZ_ACL'] + # Translate the Amazon ACL to something that can be + # implemented in Swift, 501 otherwise. Swift uses POST + # for ACLs, whereas S3 uses PUT. + del req.environ['HTTP_X_AMZ_ACL'] + if req.query_string: + req.query_string = '' + + try: + translated_acl = swift_acl_translate(amz_acl) + except ACLError: + raise InvalidArgument('x-amz-acl', amz_acl) + + for header, acl in translated_acl: + req.headers[header] = acl diff --git a/swift/common/middleware/s3api/controllers/__init__.py b/swift/common/middleware/s3api/controllers/__init__.py new file mode 100644 index 0000000000..9e14bd0035 --- /dev/null +++ b/swift/common/middleware/s3api/controllers/__init__.py @@ -0,0 +1,58 @@ +# Copyright (c) 2014 OpenStack Foundation. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
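For orientation, the canned-ACL translation in acl_utils.py above maps roughly as follows. This is an illustrative REPL-style sketch; the return values are taken from the swift_acl mapping in the code.

from swift.common.middleware.s3api.acl_utils import swift_acl_translate

swift_acl_translate('public-read')
# -> [['X-Container-Read', '.r:*,.rlistings']]
swift_acl_translate('private')
# -> [['X-Container-Write', '.'], ['X-Container-Read', '.']]
swift_acl_translate('authenticated-read')
# -> raises S3NotImplemented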
+ +from swift.common.middleware.s3api.controllers.base import Controller, \ + UnsupportedController +from swift.common.middleware.s3api.controllers.service import ServiceController +from swift.common.middleware.s3api.controllers.bucket import BucketController +from swift.common.middleware.s3api.controllers.obj import ObjectController + +from swift.common.middleware.s3api.controllers.acl import AclController +from swift.common.middleware.s3api.controllers.s3_acl import S3AclController +from swift.common.middleware.s3api.controllers.multi_delete import \ + MultiObjectDeleteController +from swift.common.middleware.s3api.controllers.multi_upload import \ + UploadController, PartController, UploadsController +from swift.common.middleware.s3api.controllers.location import \ + LocationController +from swift.common.middleware.s3api.controllers.logging import \ + LoggingStatusController +from swift.common.middleware.s3api.controllers.versioning import \ + VersioningController +from swift.common.middleware.s3api.controllers.tagging import \ + TaggingController +from swift.common.middleware.s3api.controllers.object_lock import \ + ObjectLockController + +__all__ = [ + 'Controller', + 'ServiceController', + 'BucketController', + 'ObjectController', + + 'AclController', + 'S3AclController', + 'MultiObjectDeleteController', + 'PartController', + 'UploadsController', + 'UploadController', + 'LocationController', + 'LoggingStatusController', + 'VersioningController', + 'TaggingController', + 'ObjectLockController', + + 'UnsupportedController', +] diff --git a/swift/common/middleware/s3api/controllers/acl.py b/swift/common/middleware/s3api/controllers/acl.py new file mode 100644 index 0000000000..09d49a0bb1 --- /dev/null +++ b/swift/common/middleware/s3api/controllers/acl.py @@ -0,0 +1,131 @@ +# Copyright (c) 2010-2014 OpenStack Foundation. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
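The controller names exported above are also the keys that get_acl_handler() in acl_handlers.py matches against. A rough sketch of that lookup (hypothetical session, not part of the patch):

from swift.common.middleware.s3api.acl_handlers import get_acl_handler

get_acl_handler('Bucket')    # -> BucketAclHandler
get_acl_handler('S3Acl')     # -> S3AclHandler (only 'Handler' is stripped)
get_acl_handler('Location')  # -> BaseAclHandler, the default when no
                             #    dedicated handler exists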
+ +from swift.common.http import HTTP_OK +from swift.common.middleware.acl import parse_acl, referrer_allowed +from swift.common.utils import public + +from swift.common.middleware.s3api.exception import ACLError +from swift.common.middleware.s3api.controllers.base import Controller +from swift.common.middleware.s3api.s3response import ( + HTTPOk, S3NotImplemented, MalformedACLError, UnexpectedContent, + MissingSecurityHeader) +from swift.common.middleware.s3api.etree import Element, SubElement, tostring +from swift.common.middleware.s3api.acl_utils import swift_acl_translate, \ + XMLNS_XSI + + +MAX_ACL_BODY_SIZE = 200 * 1024 + + +def get_acl(account_name, headers): + """ + Attempts to construct an S3 ACL based on what is found in the swift headers + """ + + elem = Element('AccessControlPolicy') + owner = SubElement(elem, 'Owner') + SubElement(owner, 'ID').text = account_name + SubElement(owner, 'DisplayName').text = account_name + access_control_list = SubElement(elem, 'AccessControlList') + + # grant FULL_CONTROL to myself by default + grant = SubElement(access_control_list, 'Grant') + grantee = SubElement(grant, 'Grantee', nsmap={'xsi': XMLNS_XSI}) + grantee.set('{%s}type' % XMLNS_XSI, 'CanonicalUser') + SubElement(grantee, 'ID').text = account_name + SubElement(grantee, 'DisplayName').text = account_name + SubElement(grant, 'Permission').text = 'FULL_CONTROL' + + referrers, _ = parse_acl(headers.get('x-container-read')) + if referrer_allowed('unknown', referrers): + # grant public-read access + grant = SubElement(access_control_list, 'Grant') + grantee = SubElement(grant, 'Grantee', nsmap={'xsi': XMLNS_XSI}) + grantee.set('{%s}type' % XMLNS_XSI, 'Group') + SubElement(grantee, 'URI').text = \ + 'http://acs.amazonaws.com/groups/global/AllUsers' + SubElement(grant, 'Permission').text = 'READ' + + referrers, _ = parse_acl(headers.get('x-container-write')) + if referrer_allowed('unknown', referrers): + # grant public-write access + grant = SubElement(access_control_list, 'Grant') + grantee = SubElement(grant, 'Grantee', nsmap={'xsi': XMLNS_XSI}) + grantee.set('{%s}type' % XMLNS_XSI, 'Group') + SubElement(grantee, 'URI').text = \ + 'http://acs.amazonaws.com/groups/global/AllUsers' + SubElement(grant, 'Permission').text = 'WRITE' + + body = tostring(elem) + + return HTTPOk(body=body, content_type="text/plain") + + +class AclController(Controller): + """ + Handles the following APIs: + + * GET Bucket acl + * PUT Bucket acl + * GET Object acl + * PUT Object acl + + Those APIs are logged as ACL operations in the S3 server log. + """ + @public + def GET(self, req): + """ + Handles GET Bucket acl and GET Object acl. + """ + resp = req.get_response(self.app, method='HEAD') + + return get_acl(req.user_id, resp.headers) + + @public + def PUT(self, req): + """ + Handles PUT Bucket acl and PUT Object acl. + """ + if req.is_object_request: + # Handle Object ACL + raise S3NotImplemented() + else: + # Handle Bucket ACL + xml = req.xml(MAX_ACL_BODY_SIZE) + if all(['HTTP_X_AMZ_ACL' in req.environ, xml]): + # S3 doesn't allow to give ACL with both ACL header and body. + raise UnexpectedContent() + elif not any(['HTTP_X_AMZ_ACL' in req.environ, xml]): + # Both canned ACL header and xml body are missing + raise MissingSecurityHeader(missing_header_name='x-amz-acl') + else: + # correct ACL exists in the request + if xml: + # We very likely have an XML-based ACL request. 
+ # let's try to translate to the request header + try: + translated_acl = swift_acl_translate(xml, xml=True) + except ACLError: + raise MalformedACLError() + + for header, acl in translated_acl: + req.headers[header] = acl + + resp = req.get_response(self.app, 'POST') + resp.status = HTTP_OK + resp.headers.update({'Location': req.container_name}) + + return resp diff --git a/swift/common/middleware/s3api/controllers/base.py b/swift/common/middleware/s3api/controllers/base.py new file mode 100644 index 0000000000..3652b151fa --- /dev/null +++ b/swift/common/middleware/s3api/controllers/base.py @@ -0,0 +1,100 @@ +# Copyright (c) 2010-2014 OpenStack Foundation. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +import functools + +from swift.common.middleware.s3api.s3response import S3NotImplemented, \ + InvalidRequest +from swift.common.middleware.s3api.utils import camel_to_snake + + +def bucket_operation(func=None, err_resp=None, err_msg=None): + """ + A decorator to ensure that the request is a bucket operation. If the + target resource is an object, this decorator updates the request by default + so that the controller handles it as a bucket operation. If 'err_resp' is + specified, this raises it on error instead. + """ + def _bucket_operation(func): + @functools.wraps(func) + def wrapped(self, req): + if not req.is_bucket_request: + if err_resp: + raise err_resp(msg=err_msg) + + self.logger.debug('A key is specified for bucket API.') + req.object_name = None + + return func(self, req) + + return wrapped + + if func: + return _bucket_operation(func) + else: + return _bucket_operation + + +def object_operation(func): + """ + A decorator to ensure that the request is an object operation. If the + target resource is not an object, this raises an error response. + """ + @functools.wraps(func) + def wrapped(self, req): + if not req.is_object_request: + raise InvalidRequest('A key must be specified') + + return func(self, req) + + return wrapped + + +def check_container_existence(func): + """ + A decorator to ensure the container existence. + """ + @functools.wraps(func) + def check_container(self, req): + req.get_container_info(self.app) + return func(self, req) + + return check_container + + +class Controller(object): + """ + Base WSGI controller class for the middleware + """ + def __init__(self, app, conf, logger, **kwargs): + self.app = app + self.conf = conf + self.logger = logger + + @classmethod + def resource_type(cls): + """ + Returns the target resource type of this controller. + """ + name = cls.__name__[:-len('Controller')] + return camel_to_snake(name).upper() + + +class UnsupportedController(Controller): + """ + Handles unsupported requests. 
+ """ + def __init__(self, app, conf, logger, **kwargs): + raise S3NotImplemented('The requested resource is not implemented') diff --git a/swift/common/middleware/s3api/controllers/bucket.py b/swift/common/middleware/s3api/controllers/bucket.py new file mode 100644 index 0000000000..c4c8530c16 --- /dev/null +++ b/swift/common/middleware/s3api/controllers/bucket.py @@ -0,0 +1,415 @@ +# Copyright (c) 2010-2014 OpenStack Foundation. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +from base64 import standard_b64encode as b64encode +from base64 import standard_b64decode as b64decode + +from urllib.parse import quote + +from swift.common import swob +from swift.common.http import HTTP_OK +from swift.common.middleware.versioned_writes.object_versioning import \ + DELETE_MARKER_CONTENT_TYPE +from swift.common.utils import json, public, config_true_value, Timestamp, \ + cap_length +from swift.common.registry import get_swift_info + +from swift.common.middleware.s3api.controllers.base import Controller +from swift.common.middleware.s3api.etree import Element, SubElement, \ + tostring, fromstring, XMLSyntaxError, DocumentInvalid +from swift.common.middleware.s3api.s3response import \ + HTTPOk, S3NotImplemented, InvalidArgument, \ + MalformedXML, InvalidLocationConstraint, NoSuchBucket, \ + BucketNotEmpty, VersionedBucketNotEmpty, InternalError, \ + ServiceUnavailable, NoSuchKey +from swift.common.middleware.s3api.utils import MULTIUPLOAD_SUFFIX, S3Timestamp + +MAX_PUT_BUCKET_BODY_SIZE = 10240 + + +class BucketController(Controller): + """ + Handles bucket request. + """ + def _delete_segments_bucket(self, req): + """ + Before delete bucket, delete segments bucket if existing. + """ + container = req.container_name + MULTIUPLOAD_SUFFIX + marker = '' + seg = '' + + try: + resp = req.get_response(self.app, 'HEAD') + if int(resp.sw_headers['X-Container-Object-Count']) > 0: + if resp.sw_headers.get('X-Container-Sysmeta-Versions-Enabled'): + raise VersionedBucketNotEmpty() + else: + raise BucketNotEmpty() + # FIXME: This extra HEAD saves unexpected segment deletion + # but if a complete multipart upload happen while cleanup + # segment container below, completed object may be missing its + # segments unfortunately. To be safer, it might be good + # to handle if the segments can be deleted for each object. 
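            # Clarifying note (not part of the original patch): the HEAD
            # above targets the user-visible bucket, while 'container' is
            # the hidden segments bucket, i.e. the bucket name plus
            # MULTIUPLOAD_SUFFIX ('+segments').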
+ except NoSuchBucket: + pass + + try: + while True: + # delete all segments + resp = req.get_response(self.app, 'GET', container, + query={'format': 'json', + 'marker': marker}) + segments = json.loads(resp.body) + for seg in segments: + try: + req.get_response( + self.app, 'DELETE', container, + swob.bytes_to_wsgi(seg['name'].encode('utf8'))) + except NoSuchKey: + pass + except InternalError: + raise ServiceUnavailable() + if segments: + marker = seg['name'] + else: + break + req.get_response(self.app, 'DELETE', container) + except NoSuchBucket: + return + except (BucketNotEmpty, InternalError): + raise ServiceUnavailable() + + @public + def HEAD(self, req): + """ + Handle HEAD Bucket (Get Metadata) request + """ + resp = req.get_response(self.app) + + return HTTPOk(headers=resp.headers) + + def _parse_request_options(self, req, max_keys): + encoding_type = req.params.get('encoding-type') + if encoding_type is not None and encoding_type != 'url': + err_msg = 'Invalid Encoding Method specified in Request' + raise InvalidArgument('encoding-type', encoding_type, err_msg) + + # in order to judge that truncated is valid, check whether + # max_keys + 1 th element exists in swift. + query = { + 'limit': max_keys + 1, + } + if 'prefix' in req.params: + query['prefix'] = swob.wsgi_to_str(req.params['prefix']) + if 'delimiter' in req.params: + query['delimiter'] = swob.wsgi_to_str(req.params['delimiter']) + fetch_owner = False + if 'versions' in req.params: + query['versions'] = swob.wsgi_to_str(req.params['versions']) + listing_type = 'object-versions' + version_marker = swob.wsgi_to_str(req.params.get( + 'version-id-marker')) + if 'key-marker' in req.params: + query['marker'] = swob.wsgi_to_str(req.params['key-marker']) + if version_marker is not None: + if version_marker != 'null': + try: + Timestamp(version_marker) + except ValueError: + raise InvalidArgument( + 'version-id-marker', version_marker, + 'Invalid version id specified') + query['version_marker'] = version_marker + elif version_marker is not None: + err_msg = ('A version-id marker cannot be specified without ' + 'a key marker.') + raise InvalidArgument('version-id-marker', + version_marker, err_msg) + elif int(req.params.get('list-type', '1')) == 2: + listing_type = 'version-2' + if 'start-after' in req.params: + query['marker'] = swob.wsgi_to_str(req.params['start-after']) + # continuation-token overrides start-after + if 'continuation-token' in req.params: + decoded = b64decode( + req.params['continuation-token']).decode('utf8') + query['marker'] = decoded + if 'fetch-owner' in req.params: + fetch_owner = config_true_value(req.params['fetch-owner']) + else: + listing_type = 'version-1' + if 'marker' in req.params: + query['marker'] = swob.wsgi_to_str(req.params['marker']) + + return encoding_type, query, listing_type, fetch_owner + + def _build_versions_result(self, req, objects, encoding_type, + tag_max_keys, is_truncated): + elem = Element('ListVersionsResult') + SubElement(elem, 'Name').text = req.container_name + prefix = swob.wsgi_to_str(req.params.get('prefix')) + if prefix and encoding_type == 'url': + prefix = quote(prefix) + SubElement(elem, 'Prefix').text = prefix + key_marker = swob.wsgi_to_str(req.params.get('key-marker')) + if key_marker and encoding_type == 'url': + key_marker = quote(key_marker) + SubElement(elem, 'KeyMarker').text = key_marker + SubElement(elem, 'VersionIdMarker').text = swob.wsgi_to_str( + req.params.get('version-id-marker')) + if is_truncated: + if 'name' in objects[-1]: + SubElement(elem, 
'NextKeyMarker').text = \ + objects[-1]['name'] + SubElement(elem, 'NextVersionIdMarker').text = \ + objects[-1].get('version') or 'null' + if 'subdir' in objects[-1]: + SubElement(elem, 'NextKeyMarker').text = \ + objects[-1]['subdir'] + SubElement(elem, 'NextVersionIdMarker').text = 'null' + SubElement(elem, 'MaxKeys').text = str(tag_max_keys) + delimiter = swob.wsgi_to_str(req.params.get('delimiter')) + if delimiter is not None: + if encoding_type == 'url': + delimiter = quote(delimiter) + SubElement(elem, 'Delimiter').text = delimiter + if encoding_type == 'url': + SubElement(elem, 'EncodingType').text = encoding_type + SubElement(elem, 'IsTruncated').text = \ + 'true' if is_truncated else 'false' + return elem + + def _build_base_listing_element(self, req, encoding_type): + elem = Element('ListBucketResult') + SubElement(elem, 'Name').text = req.container_name + prefix = swob.wsgi_to_str(req.params.get('prefix')) + if prefix and encoding_type == 'url': + prefix = quote(prefix) + SubElement(elem, 'Prefix').text = prefix + return elem + + def _build_list_bucket_result_type_one(self, req, objects, encoding_type, + tag_max_keys, is_truncated): + elem = self._build_base_listing_element(req, encoding_type) + marker = swob.wsgi_to_str(req.params.get('marker')) + if marker and encoding_type == 'url': + marker = quote(marker) + SubElement(elem, 'Marker').text = marker + if is_truncated and 'delimiter' in req.params: + if 'name' in objects[-1]: + name = objects[-1]['name'] + else: + name = objects[-1]['subdir'] + if encoding_type == 'url': + name = quote(name.encode('utf-8')) + SubElement(elem, 'NextMarker').text = name + # XXX: really? no NextMarker when no delimiter?? + SubElement(elem, 'MaxKeys').text = str(tag_max_keys) + delimiter = swob.wsgi_to_str(req.params.get('delimiter')) + if delimiter: + if encoding_type == 'url': + delimiter = quote(delimiter) + SubElement(elem, 'Delimiter').text = delimiter + if encoding_type == 'url': + SubElement(elem, 'EncodingType').text = encoding_type + SubElement(elem, 'IsTruncated').text = \ + 'true' if is_truncated else 'false' + return elem + + def _build_list_bucket_result_type_two(self, req, objects, encoding_type, + tag_max_keys, is_truncated): + elem = self._build_base_listing_element(req, encoding_type) + if is_truncated: + if 'name' in objects[-1]: + SubElement(elem, 'NextContinuationToken').text = \ + b64encode(objects[-1]['name'].encode('utf8')) + if 'subdir' in objects[-1]: + SubElement(elem, 'NextContinuationToken').text = \ + b64encode(objects[-1]['subdir'].encode('utf8')) + if 'continuation-token' in req.params: + SubElement(elem, 'ContinuationToken').text = \ + swob.wsgi_to_str(req.params['continuation-token']) + start_after = swob.wsgi_to_str(req.params.get('start-after')) + if start_after is not None: + if encoding_type == 'url': + start_after = quote(start_after) + SubElement(elem, 'StartAfter').text = start_after + SubElement(elem, 'KeyCount').text = str(len(objects)) + SubElement(elem, 'MaxKeys').text = str(tag_max_keys) + delimiter = swob.wsgi_to_str(req.params.get('delimiter')) + if delimiter: + if encoding_type == 'url': + delimiter = quote(delimiter) + SubElement(elem, 'Delimiter').text = delimiter + if encoding_type == 'url': + SubElement(elem, 'EncodingType').text = encoding_type + SubElement(elem, 'IsTruncated').text = \ + 'true' if is_truncated else 'false' + return elem + + def _add_subdir(self, elem, o, encoding_type): + common_prefixes = SubElement(elem, 'CommonPrefixes') + name = o['subdir'] + if encoding_type == 'url': + 
name = quote(name.encode('utf-8')) + SubElement(common_prefixes, 'Prefix').text = name + + def _add_object(self, req, elem, o, encoding_type, listing_type, + fetch_owner): + name = o['name'] + if encoding_type == 'url': + name = quote(name.encode('utf-8')) + + if listing_type == 'object-versions': + if o['content_type'] == DELETE_MARKER_CONTENT_TYPE: + contents = SubElement(elem, 'DeleteMarker') + else: + contents = SubElement(elem, 'Version') + SubElement(contents, 'Key').text = name + SubElement(contents, 'VersionId').text = o.get( + 'version_id') or 'null' + if 'object_versioning' in get_swift_info(): + SubElement(contents, 'IsLatest').text = ( + 'true' if o['is_latest'] else 'false') + else: + SubElement(contents, 'IsLatest').text = 'true' + else: + contents = SubElement(elem, 'Contents') + SubElement(contents, 'Key').text = name + SubElement(contents, 'LastModified').text = \ + S3Timestamp.from_isoformat(o['last_modified']).s3xmlformat + if contents.tag != 'DeleteMarker': + if 's3_etag' in o: + # New-enough MUs are already in the right format + etag = o['s3_etag'] + elif 'slo_etag' in o: + # SLOs may be in something *close* to the MU format + etag = '"%s-N"' % o['slo_etag'].strip('"') + else: + # Normal objects just use the MD5 + etag = o['hash'] + if len(etag) < 2 or etag[::len(etag) - 1] != '""': + # Normal objects just use the MD5 + etag = '"%s"' % o['hash'] + # This also catches sufficiently-old SLOs, but we have + # no way to identify those from container listings + # Otherwise, somebody somewhere (proxyfs, maybe?) made this + # look like an RFC-compliant ETag; we don't need to + # quote-wrap. + SubElement(contents, 'ETag').text = etag + SubElement(contents, 'Size').text = str(o['bytes']) + if fetch_owner or listing_type != 'version-2': + owner = SubElement(contents, 'Owner') + SubElement(owner, 'ID').text = req.user_id + SubElement(owner, 'DisplayName').text = req.user_id + if contents.tag != 'DeleteMarker': + SubElement(contents, 'StorageClass').text = 'STANDARD' + + def _add_objects_to_result(self, req, elem, objects, encoding_type, + listing_type, fetch_owner): + for o in objects: + if 'subdir' in o: + self._add_subdir(elem, o, encoding_type) + else: + self._add_object(req, elem, o, encoding_type, listing_type, + fetch_owner) + + @public + def GET(self, req): + """ + Handle GET Bucket (List Objects) request + """ + tag_max_keys = req.get_validated_param( + 'max-keys', self.conf.max_bucket_listing) + # TODO: Separate max_bucket_listing and default_bucket_listing + max_keys = min(tag_max_keys, self.conf.max_bucket_listing) + + encoding_type, query, listing_type, fetch_owner = \ + self._parse_request_options(req, max_keys) + + resp = req.get_response(self.app, query=query) + + try: + objects = json.loads(resp.body) + except (TypeError, ValueError): + self.logger.error('Got non-JSON response trying to list %s: %r', + req.path, cap_length(resp.body, 60)) + raise + + is_truncated = max_keys > 0 and len(objects) > max_keys + objects = objects[:max_keys] + + if listing_type == 'object-versions': + func = self._build_versions_result + elif listing_type == 'version-2': + func = self._build_list_bucket_result_type_two + else: + func = self._build_list_bucket_result_type_one + elem = func(req, objects, encoding_type, tag_max_keys, is_truncated) + self._add_objects_to_result( + req, elem, objects, encoding_type, listing_type, fetch_owner) + + body = tostring(elem) + + return HTTPOk(body=body, content_type='application/xml') + + @public + def PUT(self, req): + """ + Handle PUT Bucket 
request + """ + xml = req.xml(MAX_PUT_BUCKET_BODY_SIZE) + if xml: + # check location + try: + elem = fromstring( + xml, 'CreateBucketConfiguration', self.logger) + location = elem.find('./LocationConstraint').text + except (XMLSyntaxError, DocumentInvalid): + raise MalformedXML() + except Exception as e: + self.logger.error(e) + raise + + if location not in (self.conf.location, + self.conf.location.lower()): + # s3api cannot support multiple regions currently. + raise InvalidLocationConstraint() + + resp = req.get_response(self.app) + + resp.status = HTTP_OK + resp.location = '/' + req.container_name + + return resp + + @public + def DELETE(self, req): + """ + Handle DELETE Bucket request + """ + # NB: object_versioning is responsible for cleaning up its container + if self.conf.allow_multipart_uploads: + self._delete_segments_bucket(req) + resp = req.get_response(self.app) + return resp + + @public + def POST(self, req): + """ + Handle POST Bucket request + """ + raise S3NotImplemented() diff --git a/swift/common/middleware/s3api/controllers/location.py b/swift/common/middleware/s3api/controllers/location.py new file mode 100644 index 0000000000..b4b288d833 --- /dev/null +++ b/swift/common/middleware/s3api/controllers/location.py @@ -0,0 +1,42 @@ +# Copyright (c) 2010-2014 OpenStack Foundation. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +from swift.common.utils import public + +from swift.common.middleware.s3api.controllers.base import Controller, \ + bucket_operation +from swift.common.middleware.s3api.etree import Element, tostring +from swift.common.middleware.s3api.s3response import HTTPOk + + +class LocationController(Controller): + """ + Handles GET Bucket location, which is logged as a LOCATION operation in the + S3 server log. + """ + @public + @bucket_operation + def GET(self, req): + """ + Handles GET Bucket location. + """ + req.get_response(self.app, method='HEAD') + + elem = Element('LocationConstraint') + if self.conf.location != 'us-east-1': + elem.text = self.conf.location + body = tostring(elem) + + return HTTPOk(body=body, content_type='application/xml') diff --git a/swift/common/middleware/s3api/controllers/logging.py b/swift/common/middleware/s3api/controllers/logging.py new file mode 100644 index 0000000000..5eec0151bc --- /dev/null +++ b/swift/common/middleware/s3api/controllers/logging.py @@ -0,0 +1,54 @@ +# Copyright (c) 2010-2014 OpenStack Foundation. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
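Both the LocationConstraint check in the bucket PUT handler above and LocationController read the same location option. A minimal sketch of the relevant proxy-server.conf stanza follows; the egg:swift#s3api entry point and the rest of the filter section are assumptions, while the location option and its 'us-east-1' default come from the code.

[filter:s3api]
use = egg:swift#s3api
# region reported by GET Bucket location and accepted in
# CreateBucketConfiguration on bucket PUT
location = us-east-1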
+ +from swift.common.utils import public + +from swift.common.middleware.s3api.controllers.base import Controller, \ + bucket_operation +from swift.common.middleware.s3api.etree import Element, tostring +from swift.common.middleware.s3api.s3response import ( + HTTPOk, S3NotImplemented, NoLoggingStatusForKey) + + +class LoggingStatusController(Controller): + """ + Handles the following APIs: + + * GET Bucket logging + * PUT Bucket logging + + Those APIs are logged as LOGGING_STATUS operations in the S3 server log. + """ + @public + @bucket_operation(err_resp=NoLoggingStatusForKey) + def GET(self, req): + """ + Handles GET Bucket logging. + """ + req.get_response(self.app, method='HEAD') + + # logging disabled + elem = Element('BucketLoggingStatus') + body = tostring(elem) + + return HTTPOk(body=body, content_type='application/xml') + + @public + @bucket_operation(err_resp=NoLoggingStatusForKey) + def PUT(self, req): + """ + Handles PUT Bucket logging. + """ + raise S3NotImplemented() diff --git a/swift/common/middleware/s3api/controllers/multi_delete.py b/swift/common/middleware/s3api/controllers/multi_delete.py new file mode 100644 index 0000000000..e6d00dbd0d --- /dev/null +++ b/swift/common/middleware/s3api/controllers/multi_delete.py @@ -0,0 +1,181 @@ +# Copyright (c) 2010-2014 OpenStack Foundation. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +import copy +import json + +from swift.common.constraints import MAX_OBJECT_NAME_LENGTH +from swift.common.http import HTTP_NO_CONTENT +from swift.common.swob import str_to_wsgi +from swift.common.utils import public, StreamingPile +from swift.common.registry import get_swift_info + +from swift.common.middleware.s3api.controllers.base import Controller, \ + bucket_operation +from swift.common.middleware.s3api.etree import Element, SubElement, \ + fromstring, tostring, XMLSyntaxError, DocumentInvalid +from swift.common.middleware.s3api.s3response import HTTPOk, \ + S3NotImplemented, NoSuchKey, ErrorResponse, MalformedXML, \ + UserKeyMustBeSpecified, AccessDenied, MissingRequestBodyError + + +class MultiObjectDeleteController(Controller): + """ + Handles Delete Multiple Objects, which is logged as a MULTI_OBJECT_DELETE + operation in the S3 server log. + """ + def _gen_error_body(self, error, elem, delete_list): + for key, version in delete_list: + error_elem = SubElement(elem, 'Error') + SubElement(error_elem, 'Key').text = key + if version is not None: + SubElement(error_elem, 'VersionId').text = version + SubElement(error_elem, 'Code').text = error.__class__.__name__ + SubElement(error_elem, 'Message').text = error._msg + + return tostring(elem) + + @public + @bucket_operation + def POST(self, req): + """ + Handles Delete Multiple Objects. 
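The request body parsed below has this general shape; the keys are hypothetical, a VersionId is optional per Object, and Quiet suppresses the per-key Deleted elements in the response::

    <Delete>
      <Quiet>true</Quiet>
      <Object>
        <Key>photos/cat.jpg</Key>
      </Object>
      <Object>
        <Key>photos/dog.jpg</Key>
        <VersionId>null</VersionId>
      </Object>
    </Delete>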
+ """ + def object_key_iter(elem): + for obj in elem.iterchildren('Object'): + key = obj.find('./Key').text + if not key: + raise UserKeyMustBeSpecified() + version = obj.find('./VersionId') + if version is not None: + version = version.text + + yield key, version + + max_body_size = min( + # FWIW, AWS limits multideletes to 1000 keys, and swift limits + # object names to 1024 bytes (by default). Add a factor of two to + # allow some slop. + 2 * self.conf.max_multi_delete_objects * MAX_OBJECT_NAME_LENGTH, + # But, don't let operators shoot themselves in the foot + 10 * 1024 * 1024) + + try: + xml = req.xml(max_body_size) + if not xml: + raise MissingRequestBodyError() + + req.require_md5(xml) + elem = fromstring(xml, 'Delete', self.logger) + + quiet = elem.find('./Quiet') + self.quiet = quiet is not None and quiet.text.lower() == 'true' + + delete_list = list(object_key_iter(elem)) + if len(delete_list) > self.conf.max_multi_delete_objects: + raise MalformedXML() + except (XMLSyntaxError, DocumentInvalid): + raise MalformedXML() + except ErrorResponse: + raise + except Exception as e: + self.logger.error(e) + raise + + elem = Element('DeleteResult') + + # check bucket existence + try: + req.get_response(self.app, 'HEAD') + except AccessDenied as error: + body = self._gen_error_body(error, elem, delete_list) + return HTTPOk(body=body) + + if 'object_versioning' not in get_swift_info() and any( + version not in ('null', None) + for _key, version in delete_list): + raise S3NotImplemented() + + def do_delete(base_req, key, version): + req = copy.copy(base_req) + req.environ = copy.copy(base_req.environ) + req.object_name = str_to_wsgi(key) + if version: + req.params = {'version-id': version, 'symlink': 'get'} + + try: + try: + query = req.gen_multipart_manifest_delete_query( + self.app, version=version) + except NoSuchKey: + query = {} + if version: + query['version-id'] = version + query['symlink'] = 'get' + + resp = req.get_response(self.app, method='DELETE', query=query, + headers={'Accept': 'application/json'}) + # If async segment cleanup is available, we expect to get + # back a 204; otherwise, the delete is synchronous and we + # have to read the response to actually do the SLO delete + if query.get('multipart-manifest') and \ + resp.status_int != HTTP_NO_CONTENT: + try: + delete_result = json.loads(resp.body) + if delete_result['Errors']: + # NB: bulk includes 404s in "Number Not Found", + # not "Errors" + msg_parts = [delete_result['Response Status']] + msg_parts.extend( + '%s: %s' % (obj, status) + for obj, status in delete_result['Errors']) + return key, {'code': 'SLODeleteError', + 'message': '\n'.join(msg_parts)} + # else, all good + except (ValueError, TypeError, KeyError): + # Logs get all the gory details + self.logger.exception( + 'Could not parse SLO delete response (%s): %s', + resp.status, resp.body) + # Client gets something more generic + return key, {'code': 'SLODeleteError', + 'message': 'Unexpected swift response'} + except NoSuchKey: + pass + except ErrorResponse as e: + return key, {'code': e.__class__.__name__, 'message': e._msg} + except Exception: + self.logger.exception( + 'Unexpected Error handling DELETE of %r %r' % ( + req.container_name, key)) + return key, {'code': 'Server Error', 'message': 'Server Error'} + + return key, None + + with StreamingPile(self.conf.multi_delete_concurrency) as pile: + for key, err in pile.asyncstarmap(do_delete, ( + (req, key, version) for key, version in delete_list)): + if err: + error = SubElement(elem, 'Error') + 
SubElement(error, 'Key').text = key + SubElement(error, 'Code').text = err['code'] + SubElement(error, 'Message').text = err['message'] + elif not self.quiet: + deleted = SubElement(elem, 'Deleted') + SubElement(deleted, 'Key').text = key + + body = tostring(elem) + + return HTTPOk(body=body) diff --git a/swift/common/middleware/s3api/controllers/multi_upload.py b/swift/common/middleware/s3api/controllers/multi_upload.py new file mode 100644 index 0000000000..657d9f30df --- /dev/null +++ b/swift/common/middleware/s3api/controllers/multi_upload.py @@ -0,0 +1,858 @@ +# Copyright (c) 2010-2014 OpenStack Foundation. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. +""" +Implementation of S3 Multipart Upload. + +This module implements S3 Multipart Upload APIs with the Swift SLO feature. +The following explains how S3api uses swift container and objects to store S3 +upload information: + +----------------- +[bucket]+segments +----------------- + +A container to store upload information. [bucket] is the original bucket +where multipart upload is initiated. + +----------------------------- +[bucket]+segments/[upload_id] +----------------------------- + +An object of the ongoing upload id. The object is empty and used for +checking the target upload status. If the object exists, it means that the +upload is initiated but not either completed or aborted. + +------------------------------------------- +[bucket]+segments/[upload_id]/[part_number] +------------------------------------------- + +The last suffix is the part number under the upload id. When the client uploads +the parts, they will be stored in the namespace with +[bucket]+segments/[upload_id]/[part_number]. + +Example listing result in the [bucket]+segments container:: + + [bucket]+segments/[upload_id1] # upload id object for upload_id1 + [bucket]+segments/[upload_id1]/1 # part object for upload_id1 + [bucket]+segments/[upload_id1]/2 # part object for upload_id1 + [bucket]+segments/[upload_id1]/3 # part object for upload_id1 + [bucket]+segments/[upload_id2] # upload id object for upload_id2 + [bucket]+segments/[upload_id2]/1 # part object for upload_id2 + [bucket]+segments/[upload_id2]/2 # part object for upload_id2 + . + . + +Those part objects are directly used as segments of a Swift +Static Large Object when the multipart upload is completed. 
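As a minimal sketch (an illustration, not code added by this patch; the bucket, key and upload id are hypothetical), the naming scheme above and its relation to the SLO manifest can be expressed as::

    MULTIUPLOAD_SUFFIX = '+segments'

    def part_path(bucket, key, upload_id, part_number):
        # container: mybucket+segments
        # object:    obj.dat/<upload_id>/1, obj.dat/<upload_id>/2, ...
        container = bucket + MULTIUPLOAD_SUFFIX
        obj = '%s/%s/%d' % (key, upload_id, part_number)
        return '/%s/%s' % (container, obj)

    part_path('mybucket', 'obj.dat', 'X', 1)
    # -> '/mybucket+segments/obj.dat/X/1', which is the same 'path' value that
    # the Complete Multipart Upload handler later writes into the SLO manifest.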
+ +""" + +import binascii +import copy +import os +import re +import time + +from swift.common import constraints +from swift.common.swob import Range, bytes_to_wsgi, normalize_etag, \ + wsgi_to_str +from swift.common.utils import json, public, reiterate, md5, Timestamp +from swift.common.request_helpers import get_container_update_override_key, \ + get_param + +from urllib.parse import quote, urlparse + +from swift.common.middleware.s3api.controllers.base import Controller, \ + bucket_operation, object_operation, check_container_existence +from swift.common.middleware.s3api.s3response import InvalidArgument, \ + ErrorResponse, MalformedXML, KeyTooLongError, InvalidPart, \ + BucketAlreadyExists, EntityTooSmall, InvalidPartOrder, InvalidRequest, \ + HTTPOk, HTTPNoContent, NoSuchKey, NoSuchUpload, NoSuchBucket, \ + BucketAlreadyOwnedByYou, ServiceUnavailable, PreconditionFailed, \ + S3NotImplemented +from swift.common.middleware.s3api.utils import unique_id, \ + MULTIUPLOAD_SUFFIX, S3Timestamp, sysmeta_header +from swift.common.middleware.s3api.etree import Element, SubElement, \ + fromstring, tostring, XMLSyntaxError, DocumentInvalid +from swift.common.storage_policy import POLICIES + +DEFAULT_MAX_PARTS_LISTING = 1000 +DEFAULT_MAX_UPLOADS = 1000 + +MAX_COMPLETE_UPLOAD_BODY_SIZE = 2048 * 1024 + + +def _get_upload_info(req, app, upload_id): + """ + Make a HEAD request for existing upload object metadata. Tries the upload + marker first, and then falls back to the manifest object. + + :param req: an S3Request object. + :param app: the wsgi app. + :param upload_id: the upload id. + :returns: a tuple of (S3Response, boolean) where the boolean is True if the + response is from the upload marker and False otherwise. + :raises: NoSuchUpload if neither the marker nor the manifest were found. + """ + + container = req.container_name + MULTIUPLOAD_SUFFIX + obj = '%s/%s' % (req.object_name, upload_id) + + # XXX: if we leave the copy-source header, somewhere later we might + # drop in a ?version-id=... query string that's utterly inappropriate + # for the upload marker. Until we get around to fixing that, just pop + # it off for now... + copy_source = req.headers.pop('X-Amz-Copy-Source', None) + try: + resp = req.get_response(app, 'HEAD', container=container, obj=obj) + return resp, True + except NoSuchKey: + # ensure consistent path and policy are logged despite manifest HEAD + upload_marker_path = req.environ.get('s3api.backend_path') + policy_index = req.policy_index + try: + resp = req.get_response(app, 'HEAD') + if resp.sysmeta_headers.get(sysmeta_header( + 'object', 'upload-id')) == upload_id: + return resp, False + except NoSuchKey: + pass + finally: + # Ops often find it more useful for us to log the upload marker + # path, so put it back + if upload_marker_path is not None: + req.environ['s3api.backend_path'] = upload_marker_path + if policy_index is not None: + req.policy_index = policy_index + raise NoSuchUpload(upload_id=upload_id) + finally: + # ...making sure to restore any copy-source before returning + if copy_source is not None: + req.headers['X-Amz-Copy-Source'] = copy_source + + +def _make_complete_body(req, s3_etag, yielded_anything): + result_elem = Element('CompleteMultipartUploadResult') + + # NOTE: boto with sig v4 appends port to HTTP_HOST value at + # the request header when the port is non default value and it + # makes req.host_url like as http://localhost:8080:8080/path + # that obviously invalid. 
Probably it should be resolved at + # swift.common.swob though, tentatively we are parsing and + # reconstructing the correct host_url info here. + # in detail, https://github.com/boto/boto/pull/3513 + parsed_url = urlparse(req.host_url) + host_url = '%s://%s' % (parsed_url.scheme, parsed_url.hostname) + # Why are we doing our own port parsing? Because py3 decided + # to start raising ValueErrors on access after parsing such + # an invalid port + netloc = parsed_url.netloc.split('@')[-1].split(']')[-1] + if ':' in netloc: + port = netloc.split(':', 2)[1] + host_url += ':%s' % port + + SubElement(result_elem, 'Location').text = host_url + req.path + SubElement(result_elem, 'Bucket').text = req.container_name + SubElement(result_elem, 'Key').text = wsgi_to_str(req.object_name) + SubElement(result_elem, 'ETag').text = '"%s"' % s3_etag + body = tostring(result_elem, xml_declaration=not yielded_anything) + if yielded_anything: + return b'\n' + body + return body + + +class PartController(Controller): + """ + Handles the following APIs: + + * Upload Part + * Upload Part - Copy + + Those APIs are logged as PART operations in the S3 server log. + """ + @public + @object_operation + @check_container_existence + def PUT(self, req): + """ + Handles Upload Part and Upload Part Copy. + """ + + if 'uploadId' not in req.params: + raise InvalidArgument('ResourceType', 'partNumber', + 'Unexpected query string parameter') + + part_number = req.validate_part_number() + + upload_id = get_param(req, 'uploadId') + _get_upload_info(req, self.app, upload_id) + + req.container_name += MULTIUPLOAD_SUFFIX + req.object_name = '%s/%s/%d' % (req.object_name, upload_id, + part_number) + + req_timestamp = S3Timestamp.now() + req.headers['X-Timestamp'] = req_timestamp.internal + source_resp = req.check_copy_source(self.app) + if 'X-Amz-Copy-Source' in req.headers and \ + 'X-Amz-Copy-Source-Range' in req.headers: + rng = req.headers['X-Amz-Copy-Source-Range'] + + header_valid = True + try: + rng_obj = Range(rng) + if len(rng_obj.ranges) != 1: + header_valid = False + except ValueError: + header_valid = False + if not header_valid: + err_msg = ('The x-amz-copy-source-range value must be of the ' + 'form bytes=first-last where first and last are ' + 'the zero-based offsets of the first and last ' + 'bytes to copy') + raise InvalidArgument('x-amz-source-range', rng, err_msg) + + source_size = int(source_resp.headers['Content-Length']) + if not rng_obj.ranges_for_length(source_size): + err_msg = ('Range specified is not valid for source object ' + 'of size: %s' % source_size) + raise InvalidArgument('x-amz-source-range', rng, err_msg) + + req.headers['Range'] = rng + del req.headers['X-Amz-Copy-Source-Range'] + if 'X-Amz-Copy-Source' in req.headers: + # Clear some problematic headers that might be on the source + req.headers.update({ + sysmeta_header('object', 'etag'): '', + 'X-Object-Sysmeta-Swift3-Etag': '', # for legacy data + 'X-Object-Sysmeta-Slo-Etag': '', + 'X-Object-Sysmeta-Slo-Size': '', + get_container_update_override_key('etag'): '', + }) + resp = req.get_response(self.app) + + if 'X-Amz-Copy-Source' in req.headers: + resp.append_copy_resp_body(req.controller_name, + req_timestamp.s3xmlformat) + + resp.status = 200 + return resp + + +class UploadsController(Controller): + """ + Handles the following APIs: + + * List Multipart Uploads + * Initiate Multipart Upload + + Those APIs are logged as UPLOADS operations in the S3 server log. 
+ """ + @public + @bucket_operation(err_resp=InvalidRequest, + err_msg="Key is not expected for the GET method " + "?uploads subresource") + @check_container_existence + def GET(self, req): + """ + Handles List Multipart Uploads + """ + + def separate_uploads(uploads, prefix, delimiter): + """ + separate_uploads will separate uploads into non_delimited_uploads + (a subset of uploads) and common_prefixes according to the + specified delimiter. non_delimited_uploads is a list of uploads + which exclude the delimiter. common_prefixes is a set of prefixes + prior to the specified delimiter. Note that the prefix in the + common_prefixes includes the delimiter itself. + + i.e. if '/' delimiter specified and then the uploads is consists of + ['foo', 'foo/bar'], this function will return (['foo'], ['foo/']). + + :param uploads: A list of uploads dictionary + :param prefix: A string of prefix reserved on the upload path. + (i.e. the delimiter must be searched behind the + prefix) + :param delimiter: A string of delimiter to split the path in each + upload + + :return (non_delimited_uploads, common_prefixes) + """ + non_delimited_uploads = [] + common_prefixes = set() + for upload in uploads: + key = upload['key'] + end = key.find(delimiter, len(prefix)) + if end >= 0: + common_prefix = key[:end + len(delimiter)] + common_prefixes.add(common_prefix) + else: + non_delimited_uploads.append(upload) + return non_delimited_uploads, sorted(common_prefixes) + + encoding_type = get_param(req, 'encoding-type') + if encoding_type is not None and encoding_type != 'url': + err_msg = 'Invalid Encoding Method specified in Request' + raise InvalidArgument('encoding-type', encoding_type, err_msg) + + keymarker = get_param(req, 'key-marker', '') + uploadid = get_param(req, 'upload-id-marker', '') + maxuploads = req.get_validated_param( + 'max-uploads', DEFAULT_MAX_UPLOADS, DEFAULT_MAX_UPLOADS) + + query = { + 'format': 'json', + 'marker': '', + } + + if uploadid and keymarker: + query.update({'marker': '%s/%s' % (keymarker, uploadid)}) + elif keymarker: + query.update({'marker': '%s/~' % (keymarker)}) + if 'prefix' in req.params: + query.update({'prefix': get_param(req, 'prefix')}) + + container = req.container_name + MULTIUPLOAD_SUFFIX + uploads = [] + prefixes = [] + + def object_to_upload(object_info): + obj, upid = object_info['name'].rsplit('/', 1) + obj_dict = {'key': obj, + 'upload_id': upid, + 'last_modified': object_info['last_modified']} + return obj_dict + + is_segment = re.compile('.*/[0-9]+$') + + while len(uploads) < maxuploads: + try: + resp = req.get_response(self.app, container=container, + query=query) + objects = json.loads(resp.body) + except NoSuchBucket: + # Assume NoSuchBucket as no uploads + objects = [] + if not objects: + break + + new_uploads = [object_to_upload(obj) for obj in objects + if not is_segment.match(obj.get('name', ''))] + new_prefixes = [] + if 'delimiter' in req.params: + prefix = get_param(req, 'prefix', '') + delimiter = get_param(req, 'delimiter') + new_uploads, new_prefixes = separate_uploads( + new_uploads, prefix, delimiter) + uploads.extend(new_uploads) + prefixes.extend(new_prefixes) + query['marker'] = objects[-1]['name'] + + truncated = len(uploads) >= maxuploads + if len(uploads) > maxuploads: + uploads = uploads[:maxuploads] + + nextkeymarker = '' + nextuploadmarker = '' + if len(uploads) > 1: + nextuploadmarker = uploads[-1]['upload_id'] + nextkeymarker = uploads[-1]['key'] + + result_elem = Element('ListMultipartUploadsResult') + SubElement(result_elem, 
'Bucket').text = req.container_name + SubElement(result_elem, 'KeyMarker').text = keymarker + SubElement(result_elem, 'UploadIdMarker').text = uploadid + SubElement(result_elem, 'NextKeyMarker').text = nextkeymarker + SubElement(result_elem, 'NextUploadIdMarker').text = nextuploadmarker + if 'delimiter' in req.params: + SubElement(result_elem, 'Delimiter').text = \ + get_param(req, 'delimiter') + if 'prefix' in req.params: + SubElement(result_elem, 'Prefix').text = get_param(req, 'prefix') + SubElement(result_elem, 'MaxUploads').text = str(maxuploads) + if encoding_type is not None: + SubElement(result_elem, 'EncodingType').text = encoding_type + SubElement(result_elem, 'IsTruncated').text = \ + 'true' if truncated else 'false' + + # TODO: don't show uploads which are initiated before this bucket is + # created. + for u in uploads: + upload_elem = SubElement(result_elem, 'Upload') + name = u['key'] + if encoding_type == 'url': + name = quote(name) + SubElement(upload_elem, 'Key').text = name + SubElement(upload_elem, 'UploadId').text = u['upload_id'] + initiator_elem = SubElement(upload_elem, 'Initiator') + SubElement(initiator_elem, 'ID').text = req.user_id + SubElement(initiator_elem, 'DisplayName').text = req.user_id + owner_elem = SubElement(upload_elem, 'Owner') + SubElement(owner_elem, 'ID').text = req.user_id + SubElement(owner_elem, 'DisplayName').text = req.user_id + SubElement(upload_elem, 'StorageClass').text = 'STANDARD' + SubElement(upload_elem, 'Initiated').text = \ + S3Timestamp.from_isoformat(u['last_modified']).s3xmlformat + + for p in prefixes: + elem = SubElement(result_elem, 'CommonPrefixes') + SubElement(elem, 'Prefix').text = p + + body = tostring(result_elem) + + return HTTPOk(body=body, content_type='application/xml') + + @public + @object_operation + @check_container_existence + def POST(self, req): + """ + Handles Initiate Multipart Upload. + """ + if len(req.object_name) > constraints.MAX_OBJECT_NAME_LENGTH: + # Note that we can still run into trouble where the MPU is just + # within the limit, which means the segment names will go over + raise KeyTooLongError() + + # Create a unique S3 upload id from UUID to avoid duplicates. 
+ upload_id = unique_id() + + seg_container = req.container_name + MULTIUPLOAD_SUFFIX + content_type = req.headers.get('Content-Type') + if content_type: + req.headers[sysmeta_header('object', 'has-content-type')] = 'yes' + req.headers[ + sysmeta_header('object', 'content-type')] = content_type + else: + req.headers[sysmeta_header('object', 'has-content-type')] = 'no' + req.headers['Content-Type'] = 'application/directory' + + try: + seg_req = copy.copy(req) + seg_req.environ = copy.copy(req.environ) + seg_req.container_name = seg_container + seg_req.get_container_info(self.app) + except NoSuchBucket: + try: + # multi-upload bucket doesn't exist, create one with + # same storage policy and acls as the primary bucket + info = req.get_container_info(self.app) + policy_name = POLICIES[info['storage_policy']].name + hdrs = {'X-Storage-Policy': policy_name} + if info.get('read_acl'): + hdrs['X-Container-Read'] = info['read_acl'] + if info.get('write_acl'): + hdrs['X-Container-Write'] = info['write_acl'] + seg_req.get_response(self.app, 'PUT', seg_container, '', + headers=hdrs) + except (BucketAlreadyExists, BucketAlreadyOwnedByYou): + pass + + obj = '%s/%s' % (req.object_name, upload_id) + + req.headers.pop('Etag', None) + req.headers.pop('Content-Md5', None) + + req.get_response(self.app, 'PUT', seg_container, obj, body='') + + result_elem = Element('InitiateMultipartUploadResult') + SubElement(result_elem, 'Bucket').text = req.container_name + SubElement(result_elem, 'Key').text = wsgi_to_str(req.object_name) + SubElement(result_elem, 'UploadId').text = upload_id + + body = tostring(result_elem) + + return HTTPOk(body=body, content_type='application/xml') + + +class UploadController(Controller): + """ + Handles the following APIs: + + * List Parts + * Abort Multipart Upload + * Complete Multipart Upload + + Those APIs are logged as UPLOAD operations in the S3 server log. + """ + @public + @object_operation + @check_container_existence + def GET(self, req): + """ + Handles List Parts. + """ + def filter_part_num_marker(o): + try: + num = int(os.path.basename(o['name'])) + return num > part_num_marker + except ValueError: + return False + + encoding_type = get_param(req, 'encoding-type') + if encoding_type is not None and encoding_type != 'url': + err_msg = 'Invalid Encoding Method specified in Request' + raise InvalidArgument('encoding-type', encoding_type, err_msg) + + upload_id = get_param(req, 'uploadId') + _get_upload_info(req, self.app, upload_id) + + maxparts = req.get_validated_param( + 'max-parts', DEFAULT_MAX_PARTS_LISTING, + self.conf.max_parts_listing) + part_num_marker = req.get_validated_param( + 'part-number-marker', 0) + + object_name = wsgi_to_str(req.object_name) + query = { + 'format': 'json', + 'prefix': '%s/%s/' % (object_name, upload_id), + 'delimiter': '/', + 'marker': '', + } + + container = req.container_name + MULTIUPLOAD_SUFFIX + # Because the parts are out of order in Swift, we list up to the + # maximum number of parts and then apply the marker and limit options. + objects = [] + while True: + resp = req.get_response(self.app, container=container, obj='', + query=query) + new_objects = json.loads(resp.body) + if not new_objects: + break + objects.extend(new_objects) + query['marker'] = new_objects[-1]['name'] + + last_part = 0 + + # If the caller requested a list starting at a specific part number, + # construct a sub-set of the object list. 
+ objList = [obj for obj in objects if filter_part_num_marker(obj)] + + # pylint: disable-msg=E1103 + objList.sort(key=lambda o: int(o['name'].split('/')[-1])) + + if len(objList) > maxparts: + objList = objList[:maxparts] + truncated = True + else: + truncated = False + # TODO: We have to retrieve object list again when truncated is True + # and some objects filtered by invalid name because there could be no + # enough objects for limit defined by maxparts. + + if objList: + o = objList[-1] + last_part = os.path.basename(o['name']) + + result_elem = Element('ListPartsResult') + SubElement(result_elem, 'Bucket').text = req.container_name + if encoding_type == 'url': + object_name = quote(object_name) + SubElement(result_elem, 'Key').text = object_name + SubElement(result_elem, 'UploadId').text = upload_id + + initiator_elem = SubElement(result_elem, 'Initiator') + SubElement(initiator_elem, 'ID').text = req.user_id + SubElement(initiator_elem, 'DisplayName').text = req.user_id + owner_elem = SubElement(result_elem, 'Owner') + SubElement(owner_elem, 'ID').text = req.user_id + SubElement(owner_elem, 'DisplayName').text = req.user_id + + SubElement(result_elem, 'StorageClass').text = 'STANDARD' + SubElement(result_elem, 'PartNumberMarker').text = str(part_num_marker) + SubElement(result_elem, 'NextPartNumberMarker').text = str(last_part) + SubElement(result_elem, 'MaxParts').text = str(maxparts) + if 'encoding-type' in req.params: + SubElement(result_elem, 'EncodingType').text = \ + get_param(req, 'encoding-type') + SubElement(result_elem, 'IsTruncated').text = \ + 'true' if truncated else 'false' + + for i in objList: + part_elem = SubElement(result_elem, 'Part') + SubElement(part_elem, 'PartNumber').text = i['name'].split('/')[-1] + SubElement(part_elem, 'LastModified').text = \ + S3Timestamp.from_isoformat(i['last_modified']).s3xmlformat + SubElement(part_elem, 'ETag').text = '"%s"' % i['hash'] + SubElement(part_elem, 'Size').text = str(i['bytes']) + + body = tostring(result_elem) + + return HTTPOk(body=body, content_type='application/xml') + + @public + @object_operation + @check_container_existence + def DELETE(self, req): + """ + Handles Abort Multipart Upload. + """ + upload_id = get_param(req, 'uploadId') + _get_upload_info(req, self.app, upload_id) + + # First check to see if this multi-part upload was already + # completed. Look in the primary container, if the object exists, + # then it was completed and we return an error here. + container = req.container_name + MULTIUPLOAD_SUFFIX + obj = '%s/%s' % (req.object_name, upload_id) + req.get_response(self.app, container=container, obj=obj) + + # The completed object was not found so this + # must be a multipart upload abort. 
+ # We must delete any uploaded segments for this UploadID and then + # delete the object in the main container as well + object_name = wsgi_to_str(req.object_name) + query = { + 'format': 'json', + 'prefix': '%s/%s/' % (object_name, upload_id), + 'delimiter': '/', + } + + resp = req.get_response(self.app, 'GET', container, '', query=query) + + # Iterate over the segment objects and delete them individually + objects = json.loads(resp.body) + while objects: + for o in objects: + container = req.container_name + MULTIUPLOAD_SUFFIX + obj = bytes_to_wsgi(o['name'].encode('utf-8')) + req.get_response(self.app, container=container, obj=obj) + query['marker'] = objects[-1]['name'] + resp = req.get_response(self.app, 'GET', container, '', + query=query) + objects = json.loads(resp.body) + + return HTTPNoContent() + + @public + @object_operation + @check_container_existence + def POST(self, req): + """ + Handles Complete Multipart Upload. + """ + upload_id = get_param(req, 'uploadId') + # Check for conditional requests before getting upload info so the + # headers can't bleed into the HEAD + if req.headers.get('If-None-Match', '*') != '*' or any( + h in req.headers for h in ( + 'If-Match', 'If-Modified-Since', 'If-Unmodified-Since')): + raise S3NotImplemented( + 'Conditional uploads are not supported.') + + resp, is_marker = _get_upload_info(req, self.app, upload_id) + if (is_marker and + resp.sw_headers.get('X-Backend-Timestamp') >= Timestamp.now()): + # Somehow the marker was created in the future w.r.t. this thread's + # clock. The manifest PUT may succeed but the subsequent marker + # DELETE will fail, so don't attempt either. + raise ServiceUnavailable + + headers = {'Accept': 'application/json', + sysmeta_header('object', 'upload-id'): upload_id} + for key, val in resp.headers.items(): + _key = key.lower() + if _key.startswith('x-amz-meta-'): + headers['x-object-meta-' + _key[11:]] = val + elif _key in ('content-encoding', 'content-language', + 'content-disposition', 'expires', 'cache-control'): + headers[key] = val + + hct_header = sysmeta_header('object', 'has-content-type') + if resp.sysmeta_headers.get(hct_header) == 'yes': + content_type = resp.sysmeta_headers.get( + sysmeta_header('object', 'content-type')) + elif hct_header in resp.sysmeta_headers: + # has-content-type is present but false, so no content type was + # set on initial upload. In that case, we won't set one on our + # PUT request. Swift will end up guessing one based on the + # object name. + content_type = None + else: + content_type = resp.headers.get('Content-Type') + + if content_type: + headers['Content-Type'] = content_type + + container = req.container_name + MULTIUPLOAD_SUFFIX + s3_etag_hasher = md5(usedforsecurity=False) + manifest = [] + previous_number = 0 + try: + xml = req.xml(MAX_COMPLETE_UPLOAD_BODY_SIZE) + if not xml: + raise InvalidRequest(msg='You must specify at least one part') + # If an MD5 was provided, we need to verify it. 
+ if req.check_md5(xml): + # We're only interested in the body here, in the + # multipart-upload controller -- *don't* let etag get + # plumbed down to the object-server + req.headers.pop('etag', None) + + complete_elem = fromstring( + xml, 'CompleteMultipartUpload', self.logger) + for part_elem in complete_elem.iterchildren('Part'): + part_number = int(part_elem.find('./PartNumber').text) + + if part_number <= previous_number: + raise InvalidPartOrder(upload_id=upload_id) + previous_number = part_number + + etag = normalize_etag(part_elem.find('./ETag').text) + if etag is None: + raise InvalidPart(upload_id=upload_id, + part_number=part_number, + e_tag=etag) + if len(etag) != 32 or any(c not in '0123456789abcdef' + for c in etag): + raise InvalidPart(upload_id=upload_id, + part_number=part_number, + e_tag=etag) + manifest.append({ + 'path': '/%s/%s/%s/%d' % ( + wsgi_to_str(container), wsgi_to_str(req.object_name), + upload_id, part_number), + 'etag': etag}) + s3_etag_hasher.update(binascii.a2b_hex(etag)) + except (XMLSyntaxError, DocumentInvalid): + # NB: our schema definitions catch uploads with no parts here + raise MalformedXML() + except ErrorResponse: + raise + except Exception as e: + self.logger.error(e) + raise + + s3_etag = '%s-%d' % (s3_etag_hasher.hexdigest(), len(manifest)) + s3_etag_header = sysmeta_header('object', 'etag') + # This header should only already be present if the upload marker + # has been cleaned up and the current target uses the same upload-id + already_uploaded_s3_etag = resp.sysmeta_headers.get(s3_etag_header) + if already_uploaded_s3_etag == s3_etag: + # If the segments to use haven't changed, the work is already done + return HTTPOk(body=_make_complete_body(req, s3_etag, False), + content_type='application/xml') + elif already_uploaded_s3_etag: + # If the header's present but *doesn't* match, upload-id is + # no longer valid + raise NoSuchUpload(upload_id=upload_id) + headers[s3_etag_header] = s3_etag + # Leave base header value blank; SLO will populate + c_etag = '; s3_etag=%s' % s3_etag + headers[get_container_update_override_key('etag')] = c_etag + + too_small_message = ('s3api requires that each segment be at least ' + '%d bytes' % self.conf.min_segment_size) + + def size_checker(manifest): + # Check the size of each segment except the last and make sure + # they are all more than the minimum upload chunk size. + # Note that we need to use the *internal* keys, since we're + # looking at the manifest that's about to be written. + return [ + (item['name'], too_small_message) + for item in manifest[:-1] + if item and item['bytes'] < self.conf.min_segment_size] + + req.environ['swift.callback.slo_manifest_hook'] = size_checker + start_time = time.time() + + def response_iter(): + # NB: XML requires that the XML declaration, if present, be at the + # very start of the document. Clients *will* call us out on not + # being valid XML if we pass through whitespace before it. 
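The S3-style multipart ETag computed above can be reproduced with a standalone sketch (hashlib.md5 stands in for swift's md5 wrapper; the part ETag used here is just the well-known MD5 of an empty body)::

    import binascii
    from hashlib import md5

    def s3_multipart_etag(part_etags):
        # MD5 over the concatenated binary MD5s of the parts, plus '-<count>'
        hasher = md5()
        for etag in part_etags:
            hasher.update(binascii.a2b_hex(etag))
        return '%s-%d' % (hasher.hexdigest(), len(part_etags))

    s3_multipart_etag(['d41d8cd98f00b204e9800998ecf8427e'] * 3)
    # -> a 32-character hex digest followed by '-3'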
+ # Track whether we've sent anything yet so we can yield out that + # declaration *first* + yielded_anything = False + + try: + try: + # TODO: add support for versioning + put_resp = req.get_response( + self.app, 'PUT', body=json.dumps(manifest), + query={'multipart-manifest': 'put', + 'heartbeat': 'on'}, + headers=headers) + if put_resp.status_int == 202: + body = [] + put_resp.fix_conditional_response() + for chunk in put_resp.response_iter: + if not chunk.strip(): + if time.time() - start_time < 10: + # Include some grace period to keep + # ceph-s3tests happy + continue + if not yielded_anything: + yield (b'\n') + yielded_anything = True + yield chunk + continue + body.append(chunk) + body = json.loads(b''.join(body)) + if body['Response Status'] == \ + '412 Precondition Failed': + raise PreconditionFailed + elif body['Response Status'] != '201 Created': + for seg, err in body['Errors']: + if err == too_small_message: + raise EntityTooSmall() + elif err in ('Etag Mismatch', '404 Not Found'): + raise InvalidPart(upload_id=upload_id) + raise InvalidRequest( + status=body['Response Status'], + msg='\n'.join(': '.join(err) + for err in body['Errors'])) + except InvalidRequest as err_resp: + msg = err_resp._msg + if too_small_message in msg: + raise EntityTooSmall(msg) + elif ', Etag Mismatch' in msg: + raise InvalidPart(upload_id=upload_id) + elif ', 404 Not Found' in msg: + raise InvalidPart(upload_id=upload_id) + else: + raise + + # clean up the multipart-upload record + obj = '%s/%s' % (req.object_name, upload_id) + try: + req.get_response(self.app, 'DELETE', container, obj) + except NoSuchKey: + # The important thing is that we wrote out a tombstone to + # make sure the marker got cleaned up. If it's already + # gone (e.g., because of concurrent completes or a retried + # complete), so much the better. + pass + + yield _make_complete_body(req, s3_etag, yielded_anything) + except ErrorResponse as err_resp: + if yielded_anything: + err_resp.xml_declaration = False + yield b'\n' + else: + # Oh good, we can still change HTTP status code, too! + resp.status = err_resp.status + for chunk in err_resp({}, lambda *a: None): + yield chunk + + resp = HTTPOk() # assume we're good for now... but see above! + resp.app_iter = reiterate(response_iter()) + resp.content_type = "application/xml" + + return resp diff --git a/swift/common/middleware/s3api/controllers/obj.py b/swift/common/middleware/s3api/controllers/obj.py new file mode 100644 index 0000000000..930beb0fe3 --- /dev/null +++ b/swift/common/middleware/s3api/controllers/obj.py @@ -0,0 +1,269 @@ +# Copyright (c) 2010-2014 OpenStack Foundation. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
+ +from io import BytesIO +import json + +from swift.common import constraints +from swift.common.http import HTTP_OK, HTTP_PARTIAL_CONTENT, HTTP_NO_CONTENT +from swift.common.request_helpers import update_etag_is_at_header +from swift.common.swob import Range, content_range_header_value, \ + normalize_etag +from swift.common.utils import public, list_from_csv +from swift.common.registry import get_swift_info + +from swift.common.middleware.versioned_writes.object_versioning import \ + DELETE_MARKER_CONTENT_TYPE +from swift.common.middleware.s3api.utils import S3Timestamp, sysmeta_header +from swift.common.middleware.s3api.controllers.base import Controller +from swift.common.middleware.s3api.s3response import S3NotImplemented, \ + InvalidRange, NoSuchKey, NoSuchVersion, InvalidArgument, HTTPNoContent, \ + PreconditionFailed, KeyTooLongError + + +class ObjectController(Controller): + """ + Handles requests on objects + """ + def _gen_head_range_resp(self, req_range, resp): + """ + Swift doesn't handle Range header for HEAD requests. + So, this method generates HEAD range response from HEAD response. + S3 return HEAD range response, if the value of range satisfies the + conditions which are described in the following document. + - http://www.w3.org/Protocols/rfc2616/rfc2616-sec14.html#sec14.35 + """ + length = int(resp.headers.get('Content-Length')) + + try: + content_range = Range(req_range) + except ValueError: + return resp + + ranges = content_range.ranges_for_length(length) + if ranges == []: + raise InvalidRange() + elif ranges: + if len(ranges) == 1: + start, end = ranges[0] + resp.headers['Content-Range'] = \ + content_range_header_value(start, end, length) + resp.headers['Content-Length'] = (end - start) + resp.status = HTTP_PARTIAL_CONTENT + return resp + else: + # TODO: It is necessary to confirm whether need to respond to + # multi-part response.(e.g. bytes=0-10,20-30) + pass + + return resp + + def GETorHEAD(self, req): + had_match = False + for match_header in ('if-match', 'if-none-match'): + if match_header not in req.headers: + continue + had_match = True + for value in list_from_csv(req.headers[match_header]): + value = normalize_etag(value) + if value.endswith('-N'): + # Deal with fake S3-like etags for SLOs uploaded via Swift + req.headers[match_header] += ', ' + value[:-2] + + if had_match: + # Update where to look + update_etag_is_at_header(req, sysmeta_header('object', 'etag')) + + object_name = req.object_name + version_id = req.params.get('versionId') + if version_id not in ('null', None) and \ + 'object_versioning' not in get_swift_info(): + raise S3NotImplemented() + part_number = req.validate_part_number(check_max=False) + + query = {} + if version_id is not None: + query['version-id'] = version_id + if part_number is not None: + query['part-number'] = part_number + + if version_id not in ('null', None): + container_info = req.get_container_info(self.app) + if not container_info.get( + 'sysmeta', {}).get('versions-container', ''): + # Versioning has never been enabled + raise NoSuchVersion(object_name, version_id) + + resp = req.get_response(self.app, query=query) + + if not resp.is_slo: + # SLO ignores part_number for non-slo objects, but s3api only + # allows the query param for non-MPU if it's exactly 1. + part_number = req.validate_part_number(parts_count=1) + if part_number == 1: + # When the query param *is* exactly 1 the response status code + # and headers are updated. 
+ resp.status = HTTP_PARTIAL_CONTENT + resp.headers['Content-Range'] = \ + 'bytes 0-%d/%s' % (int(resp.headers['Content-Length']) - 1, + resp.headers['Content-Length']) + # else: part_number is None + + if req.method == 'HEAD': + resp.app_iter = None + + if 'x-amz-meta-deleted' in resp.headers: + raise NoSuchKey(object_name) + + for key in ('content-type', 'content-language', 'expires', + 'cache-control', 'content-disposition', + 'content-encoding'): + if 'response-' + key in req.params: + resp.headers[key] = req.params['response-' + key] + + return resp + + @public + def HEAD(self, req): + """ + Handle HEAD Object request + """ + resp = self.GETorHEAD(req) + + if 'range' in req.headers: + req_range = req.headers['range'] + resp = self._gen_head_range_resp(req_range, resp) + + return resp + + @public + def GET(self, req): + """ + Handle GET Object request + """ + return self.GETorHEAD(req) + + @public + def PUT(self, req): + """ + Handle PUT Object and PUT Object (Copy) request + """ + if len(req.object_name) > constraints.MAX_OBJECT_NAME_LENGTH: + raise KeyTooLongError() + # set X-Timestamp by s3api to use at copy resp body + req_timestamp = S3Timestamp.now() + req.headers['X-Timestamp'] = req_timestamp.internal + if all(h in req.headers + for h in ('X-Amz-Copy-Source', 'X-Amz-Copy-Source-Range')): + raise InvalidArgument('x-amz-copy-source-range', + req.headers['X-Amz-Copy-Source-Range'], + 'Illegal copy header') + req.check_copy_source(self.app) + if not req.headers.get('Content-Type'): + # can't setdefault because it can be None for some reason + req.headers['Content-Type'] = 'binary/octet-stream' + resp = req.get_response(self.app) + + if 'X-Amz-Copy-Source' in req.headers: + resp.append_copy_resp_body(req.controller_name, + req_timestamp.s3xmlformat) + # delete object metadata from response + for key in list(resp.headers.keys()): + if key.lower().startswith('x-amz-meta-'): + del resp.headers[key] + + resp.status = HTTP_OK + return resp + + @public + def POST(self, req): + raise S3NotImplemented() + + def _restore_on_delete(self, req): + resp = req.get_response(self.app, 'GET', req.container_name, '', + query={'prefix': req.object_name, + 'versions': True}) + if resp.status_int != HTTP_OK: + return resp + old_versions = json.loads(resp.body) + resp = None + for item in old_versions: + if item['content_type'] == DELETE_MARKER_CONTENT_TYPE: + resp = None + break + try: + resp = req.get_response(self.app, 'PUT', query={ + 'version-id': item['version_id']}) + except PreconditionFailed: + self.logger.debug('skipping failed PUT?version-id=%s' % + item['version_id']) + continue + # if that worked, we'll go ahead and fix up the status code + resp.status_int = HTTP_NO_CONTENT + break + return resp + + @public + def DELETE(self, req): + """ + Handle DELETE Object request + """ + if 'versionId' in req.params and \ + req.params['versionId'] != 'null' and \ + 'object_versioning' not in get_swift_info(): + raise S3NotImplemented() + + version_id = req.params.get('versionId') + if version_id not in ('null', None): + container_info = req.get_container_info(self.app) + if not container_info.get( + 'sysmeta', {}).get('versions-container', ''): + # Versioning has never been enabled + return HTTPNoContent(headers={'x-amz-version-id': version_id}) + + try: + try: + query = req.gen_multipart_manifest_delete_query( + self.app, version=version_id) + except NoSuchKey: + query = {} + + req.headers['Content-Type'] = None # Ignore client content-type + + if version_id is not None: + query['version-id'] = 
version_id + query['symlink'] = 'get' + + resp = req.get_response(self.app, query=query) + # If we're going to continue using this request, we need to + # replace the now-spent body + req.environ['wsgi.input'] = BytesIO(b'') + req.headers['content-length'] = '0' + req.headers.pop('transfer-encoding', None) + if query.get('multipart-manifest') and resp.status_int == HTTP_OK: + for chunk in resp.app_iter: + pass # drain the bulk-deleter response + resp.status = HTTP_NO_CONTENT + resp.body = b'' + if resp.sw_headers.get('X-Object-Current-Version-Id') == 'null': + new_resp = self._restore_on_delete(req) + if new_resp: + resp = new_resp + except NoSuchKey: + # expect to raise NoSuchBucket when the bucket doesn't exist + req.get_container_info(self.app) + # else -- it's gone! Success. + return HTTPNoContent() + return resp diff --git a/swift/common/middleware/s3api/controllers/object_lock.py b/swift/common/middleware/s3api/controllers/object_lock.py new file mode 100644 index 0000000000..69a5295727 --- /dev/null +++ b/swift/common/middleware/s3api/controllers/object_lock.py @@ -0,0 +1,44 @@ +# Copyright (c) 2010-2023 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +from swift.common.utils import public + +from swift.common.middleware.s3api.controllers.base import Controller, \ + bucket_operation, S3NotImplemented +from swift.common.middleware.s3api.s3response import \ + ObjectLockConfigurationNotFoundError + + +class ObjectLockController(Controller): + """ + Handles GET object-lock request, which always returns + Disabled + """ + @public + @bucket_operation + def GET(self, req): + """ + Handles GET object-lock param calls. + """ + raise ObjectLockConfigurationNotFoundError(req.container_name) + + @public + @bucket_operation + def PUT(self, req): + """ + Handles PUT object-lock param calls. + """ + # Basically we don't support it, so return a 501 + raise S3NotImplemented('The requested resource is not implemented') diff --git a/swift/common/middleware/s3api/controllers/s3_acl.py b/swift/common/middleware/s3api/controllers/s3_acl.py new file mode 100644 index 0000000000..ddd7fbe3d2 --- /dev/null +++ b/swift/common/middleware/s3api/controllers/s3_acl.py @@ -0,0 +1,67 @@ +# Copyright (c) 2014 OpenStack Foundation. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
+ +from urllib.parse import quote +from swift.common.utils import public + +from swift.common.middleware.s3api.controllers.base import Controller +from swift.common.middleware.s3api.s3response import HTTPOk +from swift.common.middleware.s3api.etree import tostring + + +class S3AclController(Controller): + """ + Handles the following APIs: + + * GET Bucket acl + * PUT Bucket acl + * GET Object acl + * PUT Object acl + + Those APIs are logged as ACL operations in the S3 server log. + """ + @public + def GET(self, req): + """ + Handles GET Bucket acl and GET Object acl. + """ + resp = req.get_response(self.app, method='HEAD') + + acl = resp.object_acl if req.is_object_request else resp.bucket_acl + + resp = HTTPOk() + resp.body = tostring(acl.elem()) + + return resp + + @public + def PUT(self, req): + """ + Handles PUT Bucket acl and PUT Object acl. + """ + if req.is_object_request: + headers = {} + src_path = '/%s/%s' % (req.container_name, req.object_name) + + # object-sysmeta' can be updated by 'Copy' method, + # but can not be by 'POST' method. + # So headers['X-Copy-From'] for copy request is added here. + headers['X-Copy-From'] = quote(src_path) + headers['Content-Length'] = 0 + req.get_response(self.app, 'PUT', headers=headers) + else: + req.get_response(self.app, 'POST') + + return HTTPOk() diff --git a/swift/common/middleware/s3api/controllers/service.py b/swift/common/middleware/s3api/controllers/service.py new file mode 100644 index 0000000000..1a6564eb88 --- /dev/null +++ b/swift/common/middleware/s3api/controllers/service.py @@ -0,0 +1,70 @@ +# Copyright (c) 2010-2014 OpenStack Foundation. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +from swift.common.swob import bytes_to_wsgi +from swift.common.utils import json, public + +from swift.common.middleware.s3api.controllers.base import Controller +from swift.common.middleware.s3api.etree import Element, SubElement, tostring +from swift.common.middleware.s3api.s3response import HTTPOk, AccessDenied, \ + NoSuchBucket +from swift.common.middleware.s3api.utils import validate_bucket_name + + +class ServiceController(Controller): + """ + Handles account level requests. + """ + @public + def GET(self, req): + """ + Handle GET Service request + """ + resp = req.get_response(self.app, query={'format': 'json'}) + + containers = json.loads(resp.body) + + containers = filter( + lambda item: validate_bucket_name( + item['name'], self.conf.dns_compliant_bucket_names), + containers) + + # we don't keep the creation time of a bucket (s3cmd doesn't + # work without that) so we use something bogus. 
+ elem = Element('ListAllMyBucketsResult') + + owner = SubElement(elem, 'Owner') + SubElement(owner, 'ID').text = req.user_id + SubElement(owner, 'DisplayName').text = req.user_id + + buckets = SubElement(elem, 'Buckets') + for c in containers: + if self.conf.s3_acl and self.conf.check_bucket_owner: + container = bytes_to_wsgi(c['name'].encode('utf8')) + try: + req.get_response(self.app, 'HEAD', container) + except AccessDenied: + continue + except NoSuchBucket: + continue + + bucket = SubElement(buckets, 'Bucket') + SubElement(bucket, 'Name').text = c['name'] + SubElement(bucket, 'CreationDate').text = \ + '2009-02-03T16:45:09.000Z' + + body = tostring(elem) + + return HTTPOk(content_type='application/xml', body=body) diff --git a/swift/common/middleware/s3api/controllers/tagging.py b/swift/common/middleware/s3api/controllers/tagging.py new file mode 100644 index 0000000000..ca7bc853d2 --- /dev/null +++ b/swift/common/middleware/s3api/controllers/tagging.py @@ -0,0 +1,57 @@ +# Copyright (c) 2014 OpenStack Foundation. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +from swift.common.utils import public + +from swift.common.middleware.s3api.controllers.base import Controller, \ + S3NotImplemented +from swift.common.middleware.s3api.s3response import HTTPOk +from swift.common.middleware.s3api.etree import Element, tostring, \ + SubElement + + +class TaggingController(Controller): + """ + Handles the following APIs: + + * GET Bucket and Object tagging + * PUT Bucket and Object tagging + * DELETE Bucket and Object tagging + + """ + @public + def GET(self, req): + """ + Handles GET Bucket and Object tagging. + """ + elem = Element('Tagging') + SubElement(elem, 'TagSet') + body = tostring(elem) + + return HTTPOk(body=body, content_type=None) + + @public + def PUT(self, req): + """ + Handles PUT Bucket and Object tagging. + """ + raise S3NotImplemented('The requested resource is not implemented') + + @public + def DELETE(self, req): + """ + Handles DELETE Bucket and Object tagging. + """ + raise S3NotImplemented('The requested resource is not implemented') diff --git a/swift/common/middleware/s3api/controllers/versioning.py b/swift/common/middleware/s3api/controllers/versioning.py new file mode 100644 index 0000000000..2d31d2af50 --- /dev/null +++ b/swift/common/middleware/s3api/controllers/versioning.py @@ -0,0 +1,82 @@ +# Copyright (c) 2010-2014 OpenStack Foundation. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
+ +from swift.common.utils import public, config_true_value +from swift.common.registry import get_swift_info + +from swift.common.middleware.s3api.controllers.base import Controller, \ + bucket_operation +from swift.common.middleware.s3api.etree import Element, tostring, \ + fromstring, XMLSyntaxError, DocumentInvalid, SubElement +from swift.common.middleware.s3api.s3response import HTTPOk, \ + S3NotImplemented, MalformedXML + +MAX_PUT_VERSIONING_BODY_SIZE = 10240 + + +class VersioningController(Controller): + """ + Handles the following APIs: + + * GET Bucket versioning + * PUT Bucket versioning + + Those APIs are logged as VERSIONING operations in the S3 server log. + """ + @public + @bucket_operation + def GET(self, req): + """ + Handles GET Bucket versioning. + """ + sysmeta = req.get_container_info(self.app).get('sysmeta', {}) + + elem = Element('VersioningConfiguration') + if sysmeta.get('versions-enabled'): + SubElement(elem, 'Status').text = ( + 'Enabled' if config_true_value(sysmeta['versions-enabled']) + else 'Suspended') + body = tostring(elem) + + return HTTPOk(body=body, content_type=None) + + @public + @bucket_operation + def PUT(self, req): + """ + Handles PUT Bucket versioning. + """ + if 'object_versioning' not in get_swift_info(): + raise S3NotImplemented() + + xml = req.xml(MAX_PUT_VERSIONING_BODY_SIZE) + try: + elem = fromstring(xml, 'VersioningConfiguration') + status = elem.find('./Status').text + except (XMLSyntaxError, DocumentInvalid): + raise MalformedXML() + except Exception as e: + self.logger.error(e) + raise + + if status not in ['Enabled', 'Suspended']: + raise MalformedXML() + + # Set up versioning + # NB: object_versioning responsible for ensuring its container exists + req.headers['X-Versions-Enabled'] = str(status == 'Enabled').lower() + req.get_response(self.app, 'POST') + + return HTTPOk() diff --git a/swift/common/middleware/s3api/etree.py b/swift/common/middleware/s3api/etree.py new file mode 100644 index 0000000000..e5d4112b8f --- /dev/null +++ b/swift/common/middleware/s3api/etree.py @@ -0,0 +1,150 @@ +# Copyright (c) 2014 OpenStack Foundation. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
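The body accepted by the PUT Bucket versioning handler above is the standard S3 versioning document; a Status other than Enabled or Suspended is rejected as MalformedXML::

    <VersioningConfiguration xmlns="http://s3.amazonaws.com/doc/2006-03-01/">
      <Status>Enabled</Status>
    </VersioningConfiguration>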
+ +import lxml.etree +from copy import deepcopy +try: + # importlib.resources was introduced in py37, but couldn't handle + # resources in subdirectories (which we use); files() added support + from importlib.resources import files + del files +except ImportError: + # python < 3.9 + from pkg_resources import resource_stream # pylint: disable-msg=E0611 +else: + import importlib.resources + resource_stream = None + +from swift.common.utils import get_logger +from swift.common.middleware.s3api.exception import S3Exception +from swift.common.middleware.s3api.utils import camel_to_snake, \ + utf8decode + +XMLNS_S3 = 'http://s3.amazonaws.com/doc/2006-03-01/' +XMLNS_XSI = 'http://www.w3.org/2001/XMLSchema-instance' + + +class XMLSyntaxError(S3Exception): + pass + + +class DocumentInvalid(S3Exception): + pass + + +def cleanup_namespaces(elem): + def remove_ns(tag, ns): + if tag.startswith('{%s}' % ns): + tag = tag[len('{%s}' % ns):] + return tag + + if not isinstance(elem.tag, str): + # elem is a comment element. + return + + # remove s3 namespace + elem.tag = remove_ns(elem.tag, XMLNS_S3) + + # remove default namespace + if elem.nsmap and None in elem.nsmap: + elem.tag = remove_ns(elem.tag, elem.nsmap[None]) + + for e in elem.iterchildren(): + cleanup_namespaces(e) + + +def fromstring(text, root_tag=None, logger=None): + try: + elem = lxml.etree.fromstring(text, parser) + except lxml.etree.XMLSyntaxError as e: + if logger: + logger.debug(e) + raise XMLSyntaxError(e) + + cleanup_namespaces(elem) + + if root_tag is not None: + # validate XML + try: + path = 'schema/%s.rng' % camel_to_snake(root_tag) + if resource_stream: + # python < 3.9 + stream = resource_stream(__name__, path) + else: + stream = importlib.resources.files( + __name__.rsplit('.', 1)[0]).joinpath(path).open('rb') + with stream as rng: + lxml.etree.RelaxNG(file=rng).assertValid(elem) + except IOError as e: + # Probably, the schema file doesn't exist. + logger = logger or get_logger({}, log_route='s3api') + logger.error(e) + raise + except lxml.etree.DocumentInvalid as e: + if logger: + logger.debug(e) + raise DocumentInvalid(e) + + return elem + + +def tostring(tree, use_s3ns=True, xml_declaration=True): + if use_s3ns: + nsmap = tree.nsmap.copy() + nsmap[None] = XMLNS_S3 + + root = Element(tree.tag, attrib=tree.attrib, nsmap=nsmap) + root.text = tree.text + root.extend(deepcopy(list(tree))) + tree = root + + return lxml.etree.tostring(tree, xml_declaration=xml_declaration, + encoding='UTF-8') + + +class _Element(lxml.etree.ElementBase): + """ + Wrapper Element class of lxml.etree.Element to support + a utf-8 encoded non-ascii string as a text. + + Why we need this?: + Original lxml.etree.Element supports only unicode for the text. + It declines maintainability because we have to call a lot of encode/decode + methods to apply account/container/object name (i.e. PATH_INFO) to each + Element instance. When using this class, we can remove such a redundant + codes from swift.common.middleware.s3api middleware. 
+ """ + def __init__(self, *args, **kwargs): + # pylint: disable-msg=E1002 + super(_Element, self).__init__(*args, **kwargs) + + @property + def text(self): + """ + utf-8 wrapper property of lxml.etree.Element.text + """ + return lxml.etree.ElementBase.text.__get__(self) + + @text.setter + def text(self, value): + lxml.etree.ElementBase.text.__set__(self, utf8decode(value)) + + +parser_lookup = lxml.etree.ElementDefaultClassLookup(element=_Element) +parser = lxml.etree.XMLParser(resolve_entities=False, no_network=True) +parser.set_element_class_lookup(parser_lookup) + +Element = parser.makeelement +SubElement = lxml.etree.SubElement diff --git a/swift/common/middleware/s3api/exception.py b/swift/common/middleware/s3api/exception.py new file mode 100644 index 0000000000..c12ee3f3ac --- /dev/null +++ b/swift/common/middleware/s3api/exception.py @@ -0,0 +1,122 @@ +# Copyright (c) 2014 OpenStack Foundation. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + + +class S3Exception(Exception): + pass + + +class NotS3Request(S3Exception): + pass + + +class ACLError(S3Exception): + pass + + +class InvalidBucketNameParseError(S3Exception): + + def __init__(self, bucket): + self.bucket_name = bucket + + +class InvalidURIParseError(S3Exception): + + def __init__(self, uri): + self.uri = uri + + +class InvalidSubresource(S3Exception): + def __init__(self, resource, cause): + self.resource = resource + self.cause = cause + + +class S3InputError(BaseException): + """ + There was an error with the client input detected on read(). + + Inherit from BaseException (rather than Exception) so it cuts from the + proxy-server app (which will presumably be the one reading the input) + through all the layers of the pipeline back to s3api. It should never + escape the s3api middleware. + """ + + +class S3InputIncomplete(S3InputError): + pass + + +class S3InputSizeError(S3InputError): + def __init__(self, expected, provided): + self.expected = expected + self.provided = provided + + +class S3InputChunkTooSmall(S3InputError): + def __init__(self, bad_chunk_size, chunk_number): + self.bad_chunk_size = bad_chunk_size + self.chunk_number = chunk_number + + +class S3InputMalformedTrailer(S3InputError): + pass + + +class S3InputChunkSignatureMismatch(S3InputError): + """ + Client provided a chunk-signature, but it doesn't match the data. + + This should result in a 403 going back to the client. + """ + + +class S3InputMissingSecret(S3InputError): + """ + Client provided per-chunk signatures, but we have no secret with which to + verify them. + + This happens if the auth middleware responsible for the user never called + the provided ``check_signature`` callback. + """ + + +class S3InputSHA256Mismatch(S3InputError): + """ + Client provided a X-Amz-Content-SHA256, but it doesn't match the data. + + This should result in a BadDigest going back to the client. 
+ """ + def __init__(self, expected, computed): + self.expected = expected + self.computed = computed + + +class S3InputChecksumMismatch(S3InputError): + """ + Client provided a X-Amz-Checksum-* header, but it doesn't match the data. + + This should result in a InvalidRequest going back to the client. + """ + + +class S3InputChecksumTrailerInvalid(S3InputError): + """ + Client provided a X-Amz-Checksum-* trailer, but it is not a valid format. + + This should result in a InvalidRequest going back to the client. + """ + def __init__(self, trailer_name): + self.trailer = trailer_name diff --git a/swift/common/middleware/s3api/s3api.py b/swift/common/middleware/s3api/s3api.py new file mode 100644 index 0000000000..bd928049e0 --- /dev/null +++ b/swift/common/middleware/s3api/s3api.py @@ -0,0 +1,600 @@ +# Copyright (c) 2010-2014 OpenStack Foundation. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. +""" +The s3api middleware will emulate the S3 REST api on top of swift. + +To enable this middleware to your configuration, add the s3api middleware +in front of the auth middleware. See ``proxy-server.conf-sample`` for more +detail and configurable options. + +To set up your client, ensure you are using the tempauth or keystone auth +system for swift project. +When your swift on a SAIO environment, make sure you have setting the tempauth +middleware configuration in ``proxy-server.conf``, and the access key will be +the concatenation of the account and user strings that should look like +test:tester, and the secret access key is the account password. The host should +also point to the swift storage hostname. + +The tempauth option example: + +.. code-block:: ini + + [filter:tempauth] + use = egg:swift#tempauth + user_admin_admin = admin .admin .reseller_admin + user_test_tester = testing + +An example client using tempauth with the python boto library is as follows: + +.. code-block:: python + + from boto.s3.connection import S3Connection + connection = S3Connection( + aws_access_key_id='test:tester', + aws_secret_access_key='testing', + port=8080, + host='127.0.0.1', + is_secure=False, + calling_format=boto.s3.connection.OrdinaryCallingFormat()) + +And if you using keystone auth, you need the ec2 credentials, which can +be downloaded from the API Endpoints tab of the dashboard or by openstack +ec2 command. + +Here is showing to create an EC2 credential: + +.. code-block:: console + + # openstack ec2 credentials create + +------------+---------------------------------------------------+ + | Field | Value | + +------------+---------------------------------------------------+ + | access | c2e30f2cd5204b69a39b3f1130ca8f61 | + | links | {u'self': u'http://controller:5000/v3/......'} | + | project_id | 407731a6c2d0425c86d1e7f12a900488 | + | secret | baab242d192a4cd6b68696863e07ed59 | + | trust_id | None | + | user_id | 00f0ee06afe74f81b410f3fe03d34fbc | + +------------+---------------------------------------------------+ + +An example client using keystone auth with the python boto library will be: + +.. 
code-block:: python + + from boto.s3.connection import S3Connection + connection = S3Connection( + aws_access_key_id='c2e30f2cd5204b69a39b3f1130ca8f61', + aws_secret_access_key='baab242d192a4cd6b68696863e07ed59', + port=8080, + host='127.0.0.1', + is_secure=False, + calling_format=boto.s3.connection.OrdinaryCallingFormat()) + +---------- +Deployment +---------- + +Proxy-Server Setting +^^^^^^^^^^^^^^^^^^^^ + +Set s3api before your auth in your pipeline in ``proxy-server.conf`` file. +To enable all compatibility currently supported, you should make sure that +bulk, slo, and your auth middleware are also included in your proxy +pipeline setting. + +Using tempauth, the minimum example config is: + +.. code-block:: ini + + [pipeline:main] + pipeline = proxy-logging cache s3api tempauth bulk slo proxy-logging \ +proxy-server + +When using keystone, the config will be: + +.. code-block:: ini + + [pipeline:main] + pipeline = proxy-logging cache authtoken s3api s3token keystoneauth bulk \ +slo proxy-logging proxy-server + +Finally, add the s3api middleware section: + +.. code-block:: ini + + [filter:s3api] + use = egg:swift#s3api + +.. note:: + ``keystonemiddleware.authtoken`` can be located before/after s3api but + we recommend to put it before s3api because when authtoken is after s3api, + both authtoken and s3token will issue the acceptable token to keystone + (i.e. authenticate twice). And in the ``keystonemiddleware.authtoken`` + middleware , you should set ``delay_auth_decision`` option to ``True``. + +----------- +Constraints +----------- +Currently, the s3api is being ported from https://github.com/openstack/swift3 +so any existing issues in swift3 are still remaining. Please make sure +descriptions in the example ``proxy-server.conf`` and what happens with the +config, before enabling the options. + +------------- +Supported API +------------- +The compatibility will continue to be improved upstream, you can keep and +eye on compatibility via a check tool build by SwiftStack. See +https://github.com/swiftstack/s3compat in detail. 
+ +""" + +import json +from paste.deploy import loadwsgi +from urllib.parse import parse_qs + +from swift.common import swob +from swift.common.constraints import valid_api_version +from swift.common.middleware.listing_formats import \ + MAX_CONTAINER_LISTING_CONTENT_LENGTH +from swift.common.request_helpers import append_log_info +from swift.common.wsgi import PipelineWrapper, loadcontext, WSGIContext +from swift.common.statsd_client import get_labeled_statsd_client + +from swift.common.middleware import app_property +from swift.common.middleware.s3api.exception import NotS3Request, \ + InvalidSubresource +from swift.common.middleware.s3api import s3request +from swift.common.middleware.s3api.s3response import ErrorResponse, \ + InternalError, MethodNotAllowed, S3ResponseBase, S3NotImplemented +from swift.common.utils import get_logger, config_true_value, \ + config_positive_int_value, split_path, closing_if_possible, \ + list_from_csv, parse_header, checksum +from swift.common.middleware.s3api.utils import Config, \ + classify_checksum_header_value, make_header_label +from swift.common.middleware.s3api.acl_handlers import get_acl_handler +from swift.common.registry import register_swift_info, \ + register_sensitive_header, register_sensitive_param + + +# https://docs.aws.amazon.com/AmazonS3/latest/API/sigv4-auth-using-authorization-header.html +WELL_KNOWN_SPECIFIC_SHA256_VALUES = ( + 'UNSIGNED-PAYLOAD', + 'STREAMING-UNSIGNED-PAYLOAD-TRAILER', + 'STREAMING-AWS4-HMAC-SHA256-PAYLOAD', + 'STREAMING-AWS4-HMAC-SHA256-PAYLOAD-TRAILER', + 'STREAMING-AWS4-ECDSA-P256-SHA256-PAYLOAD', + 'STREAMING-AWS4-ECDSA-P256-SHA256-PAYLOAD-TRAILER' +) +# https://docs.aws.amazon.com/AmazonS3/latest/userguide/checking-object-integrity.html +# https://docs.aws.amazon.com/AmazonS3/latest/API/API_Object.html#AmazonS3-Type-Object-ChecksumAlgorithm +# https://docs.aws.amazon.com/AmazonS3/latest/API/API_PutObject.html +# docs are unclear whether the header value is the (un-)hyphenated form + +# algorithms for x-amz-checksum-algorithm/ x-amz-sdk-checksum-algorithm +WELL_KNOWN_CHECKSUM_ALGORITHMS = ( + 'CRC64NVME', + 'CRC32', + 'CRC32C', + 'SHA1', + 'SHA256' +) +WELL_KNOWN_CHECKSUM_HEADERS = ( + 'x-amz-checksum-crc32', + 'x-amz-checksum-crc32c', + 'x-amz-checksum-sha1', + 'x-amz-checksum-sha256', + 'x-amz-checksum-crc64nvme' +) + + +class ListingEtagMiddleware(object): + def __init__(self, app): + self.app = app + + # Pass these along so get_container_info will have the configured + # odds to skip cache + _pipeline_final_app = app_property('_pipeline_final_app') + _pipeline_request_logging_app = app_property( + '_pipeline_request_logging_app') + + def __call__(self, env, start_response): + # a lot of this is cribbed from listing_formats / swob.Request + if env['REQUEST_METHOD'] != 'GET': + # Nothing to translate + return self.app(env, start_response) + + try: + v, a, c = split_path(env.get('SCRIPT_NAME', '') + + env['PATH_INFO'], 3, 3) + if not valid_api_version(v): + raise ValueError + except ValueError: + is_container_req = False + else: + is_container_req = True + if not is_container_req: + # pass through + return self.app(env, start_response) + + ctx = WSGIContext(self.app) + resp_iter = ctx._app_call(env) + + content_type = content_length = cl_index = None + for index, (header, value) in enumerate(ctx._response_headers): + header = header.lower() + if header == 'content-type': + content_type = value.split(';', 1)[0].strip() + if content_length: + break + elif header == 'content-length': + cl_index = index + try: + 
content_length = int(value) + except ValueError: + pass # ignore -- we'll bail later + if content_type: + break + + if content_type != 'application/json' or content_length is None or \ + content_length > MAX_CONTAINER_LISTING_CONTENT_LENGTH: + start_response(ctx._response_status, ctx._response_headers, + ctx._response_exc_info) + return resp_iter + + # We've done our sanity checks, slurp the response into memory + with closing_if_possible(resp_iter): + body = b''.join(resp_iter) + + try: + listing = json.loads(body) + for item in listing: + if 'subdir' in item: + continue + value, params = parse_header(item['hash']) + if 's3_etag' in params: + item['s3_etag'] = '"%s"' % params.pop('s3_etag') + item['hash'] = value + ''.join( + '; %s=%s' % kv for kv in params.items()) + except (TypeError, KeyError, ValueError): + # If anything goes wrong above, drop back to original response + start_response(ctx._response_status, ctx._response_headers, + ctx._response_exc_info) + return [body] + + body = json.dumps(listing).encode('ascii') + ctx._response_headers[cl_index] = ( + ctx._response_headers[cl_index][0], + str(len(body)), + ) + start_response(ctx._response_status, ctx._response_headers, + ctx._response_exc_info) + return [body] + + +class S3ApiMiddleware(object): + """S3Api: S3 compatibility middleware""" + def __init__(self, app, wsgi_conf, *args, **kwargs): + self.app = app + self.conf = Config() + + # Set default values if they are not configured + self.conf.allow_no_owner = config_true_value( + wsgi_conf.get('allow_no_owner', False)) + self.conf.location = wsgi_conf.get('location', 'us-east-1') + self.conf.dns_compliant_bucket_names = config_true_value( + wsgi_conf.get('dns_compliant_bucket_names', True)) + self.conf.max_bucket_listing = config_positive_int_value( + wsgi_conf.get('max_bucket_listing', 1000)) + self.conf.max_parts_listing = config_positive_int_value( + wsgi_conf.get('max_parts_listing', 1000)) + self.conf.max_multi_delete_objects = config_positive_int_value( + wsgi_conf.get('max_multi_delete_objects', 1000)) + self.conf.multi_delete_concurrency = config_positive_int_value( + wsgi_conf.get('multi_delete_concurrency', 2)) + self.conf.s3_acl = config_true_value( + wsgi_conf.get('s3_acl', False)) + self.conf.storage_domains = list_from_csv( + wsgi_conf.get('storage_domain', '')) + self.conf.auth_pipeline_check = config_true_value( + wsgi_conf.get('auth_pipeline_check', True)) + self.conf.max_upload_part_num = config_positive_int_value( + wsgi_conf.get('max_upload_part_num', 1000)) + self.conf.check_bucket_owner = config_true_value( + wsgi_conf.get('check_bucket_owner', False)) + self.conf.force_swift_request_proxy_log = config_true_value( + wsgi_conf.get('force_swift_request_proxy_log', False)) + self.conf.allow_multipart_uploads = config_true_value( + wsgi_conf.get('allow_multipart_uploads', True)) + self.conf.min_segment_size = config_positive_int_value( + wsgi_conf.get('min_segment_size', 5242880)) + self.conf.allowable_clock_skew = config_positive_int_value( + wsgi_conf.get('allowable_clock_skew', 15 * 60)) + self.conf.cors_preflight_allow_origin = list_from_csv(wsgi_conf.get( + 'cors_preflight_allow_origin', '')) + if '*' in self.conf.cors_preflight_allow_origin and \ + len(self.conf.cors_preflight_allow_origin) > 1: + raise ValueError('if cors_preflight_allow_origin should include ' + 'all domains, * must be the only entry') + self.conf.ratelimit_as_client_error = config_true_value( + wsgi_conf.get('ratelimit_as_client_error', False)) + + self.logger = get_logger( + 
wsgi_conf, log_route='s3api', statsd_tail_prefix='s3api') + self.statsd = get_labeled_statsd_client(wsgi_conf, self.logger) + + self.check_pipeline(wsgi_conf) + checksum.log_selected_implementation(self.logger) + + def is_s3_cors_preflight(self, env): + if env['REQUEST_METHOD'] != 'OPTIONS' or not env.get('HTTP_ORIGIN'): + # Not a CORS preflight + return False + acrh = env.get('HTTP_ACCESS_CONTROL_REQUEST_HEADERS', '').lower() + if 'authorization' in acrh and \ + not env['PATH_INFO'].startswith(('/v1/', '/v1.0/')): + return True + q = parse_qs(env.get('QUERY_STRING', '')) + if 'AWSAccessKeyId' in q or 'X-Amz-Credential' in q: + return True + # Not S3, apparently + return False + + def _make_req_header_labels(self, env): + req_headers = swob.HeaderEnvironProxy(env) + labels = {} + for hdr_key, hdr_val in req_headers.items(): + label_val = None + hdr_key = hdr_key.lower() + label_key = make_header_label(hdr_key) + if hdr_key == 'content-encoding': + if 'aws-chunked' in list_from_csv(hdr_val.lower()): + label_val = 'aws-chunked' + elif hdr_key == 'transfer-encoding': + if 'chunked' in list_from_csv(hdr_val.lower()): + label_val = 'chunked' + elif hdr_key == 'x-amz-decoded-content-length': + label_val = True + elif hdr_key == 'x-amz-content-sha256': + if hdr_val in WELL_KNOWN_SPECIFIC_SHA256_VALUES: + label_val = hdr_val + else: + label_val = classify_checksum_header_value(hdr_val) + elif hdr_key == 'content-md5': + label_val = classify_checksum_header_value(hdr_val) + elif hdr_key in s3request.CHECKSUMS_BY_HEADER.keys(): + label_val = classify_checksum_header_value(hdr_val) + elif hdr_key == 'x-amz-trailer': + if hdr_val.lower() in s3request.CHECKSUMS_BY_HEADER.keys(): + label_val = hdr_val.lower() + else: + label_val = 'unknown' + elif hdr_key in ('x-amz-checksum-algorithm', + 'x-amz-sdk-checksum-algorithm'): + hdr_val_normalised = hdr_val.upper().replace('-', '') + if hdr_val_normalised in WELL_KNOWN_CHECKSUM_ALGORITHMS: + label_val = hdr_val_normalised + else: + label_val = 'unknown' + + if label_val is not None: + labels[label_key] = label_val + + return labels + + def _emit_response_header_stats(self, env, resp, labels): + if not labels: + return + + labels['status'] = resp.status_int + labels['method'] = env.get('REQUEST_METHOD') + swift_path = env.get('swift.backend_path') + if swift_path: + vers, acc, con, obj = split_path(swift_path, 1, 4, True) + if obj: + labels['type'] = 'object' + labels['account'] = acc + labels['container'] = con + elif con: + labels['type'] = 'container' + labels['account'] = acc + labels['container'] = con + elif acc: + labels['account'] = acc + labels['type'] = 'account' + else: + labels['type'] = 'UNKNOWN' + else: + labels['type'] = 'UNKNOWN' + + self.statsd.increment("swift_s3_checksum_algo_request", labels=labels) + + def __call__(self, env, start_response): + # get metrics header labels before any mutation of the headers + req_header_labels = self._make_req_header_labels(env) + origin = env.get('HTTP_ORIGIN') + if self.conf.cors_preflight_allow_origin and \ + self.is_s3_cors_preflight(env): + # I guess it's likely going to be an S3 request? 
*shrug* + if self.conf.cors_preflight_allow_origin != ['*'] and \ + origin not in self.conf.cors_preflight_allow_origin: + start_response('401 Unauthorized', [ + ('Allow', 'GET, HEAD, PUT, POST, DELETE, OPTIONS'), + ]) + return [b''] + + headers = [ + ('Allow', 'GET, HEAD, PUT, POST, DELETE, OPTIONS'), + ('Access-Control-Allow-Origin', origin), + ('Access-Control-Allow-Methods', + 'GET, HEAD, PUT, POST, DELETE, OPTIONS'), + ('Vary', 'Origin, Access-Control-Request-Headers'), + ] + acrh = set(list_from_csv( + env.get('HTTP_ACCESS_CONTROL_REQUEST_HEADERS', '').lower())) + if acrh: + headers.append(( + 'Access-Control-Allow-Headers', + ', '.join(acrh))) + + start_response('200 OK', headers) + return [b''] + + try: + req_class = s3request.get_request_class(env, self.conf.s3_acl) + req = req_class(env, self.app, self.conf) + resp = self.handle_request(req) + except NotS3Request: + return self.app(env, start_response) + except InvalidSubresource as e: + self.logger.debug(e.cause) + except ErrorResponse as err_resp: + self.logger.increment(err_resp.metric_name) + append_log_info(env, 's3:err:%s' % err_resp.summary) + if isinstance(err_resp, InternalError): + self.logger.exception(err_resp) + resp = err_resp + except Exception as e: + self.logger.exception(e) + resp = InternalError(reason=str(e)) + + if isinstance(resp, S3ResponseBase) and 'swift.trans_id' in env: + resp.headers['x-amz-id-2'] = env['swift.trans_id'] + resp.headers['x-amz-request-id'] = env['swift.trans_id'] + + if 's3api.backend_path' in env and 'swift.backend_path' not in env: + env['swift.backend_path'] = env['s3api.backend_path'] + + # emit metric with header labels now path and status may be available + self._emit_response_header_stats(env, resp, req_header_labels) + + return resp(env, start_response) + + def handle_request(self, req): + self.logger.debug('Calling S3Api Middleware') + try: + controller = req.controller(self.app, self.conf, self.logger) + except S3NotImplemented: + # TODO: Probably we should distinct the error to log this warning + self.logger.warning('multipart: No SLO middleware in pipeline') + raise + + acl_handler = get_acl_handler(req.controller_name)(req, self.logger) + req.set_acl_handler(acl_handler) + + if hasattr(controller, req.method): + handler = getattr(controller, req.method) + if not getattr(handler, 'publicly_accessible', False): + raise MethodNotAllowed(req.method, + req.controller.resource_type()) + res = handler(req) + else: + raise MethodNotAllowed(req.method, + req.controller.resource_type()) + + if req.policy_index is not None: + res.headers.setdefault('X-Backend-Storage-Policy-Index', + req.policy_index) + return res + + def check_pipeline(self, wsgi_conf): + """ + Check that proxy-server.conf has an appropriate pipeline for s3api. + """ + if wsgi_conf.get('__file__', None) is None: + return + + ctx = loadcontext(loadwsgi.APP, wsgi_conf['__file__']) + pipeline = str(PipelineWrapper(ctx)).split(' ') + + # Add compatible with 3rd party middleware. 
+ self.check_filter_order(pipeline, ['s3api', 'proxy-server']) + + auth_pipeline = pipeline[pipeline.index('s3api') + 1: + pipeline.index('proxy-server')] + + # Check SLO middleware + if self.conf.allow_multipart_uploads and 'slo' not in auth_pipeline: + self.conf.allow_multipart_uploads = False + self.logger.warning('s3api middleware requires SLO middleware ' + 'to support multi-part upload, please add it ' + 'in pipeline') + + if not self.conf.auth_pipeline_check: + self.logger.debug('Skip pipeline auth check.') + return + + if 'tempauth' in auth_pipeline: + self.logger.debug('Use tempauth middleware.') + elif 'keystoneauth' in auth_pipeline: + self.check_filter_order( + auth_pipeline, + ['s3token', 'keystoneauth']) + self.logger.debug('Use keystone middleware.') + elif len(auth_pipeline): + self.logger.debug('Use third party(unknown) auth middleware.') + else: + raise ValueError('Invalid pipeline %r: expected auth between ' + 's3api and proxy-server ' % pipeline) + + def check_filter_order(self, pipeline, required_filters): + """ + Check that required filters are present in order in the pipeline. + """ + indexes = [] + missing_filters = [] + for required_filter in required_filters: + try: + indexes.append(pipeline.index(required_filter)) + except ValueError as e: + self.logger.debug(e) + missing_filters.append(required_filter) + + if missing_filters: + raise ValueError('Invalid pipeline %r: missing filters %r' % ( + pipeline, missing_filters)) + + if indexes != sorted(indexes): + raise ValueError('Invalid pipeline %r: expected filter %s' % ( + pipeline, ' before '.join(required_filters))) + + +def filter_factory(global_conf, **local_conf): + """Standard filter factory to use the middleware with paste.deploy""" + conf = global_conf.copy() + conf.update(local_conf) + + register_swift_info( + 's3api', + # TODO: make default values as variables + max_bucket_listing=int(conf.get('max_bucket_listing', 1000)), + max_parts_listing=int(conf.get('max_parts_listing', 1000)), + max_upload_part_num=int(conf.get('max_upload_part_num', 1000)), + max_multi_delete_objects=int( + conf.get('max_multi_delete_objects', 1000)), + allow_multipart_uploads=config_true_value( + conf.get('allow_multipart_uploads', True)), + min_segment_size=int(conf.get('min_segment_size', 5242880)), + s3_acl=config_true_value(conf.get('s3_acl', False)), + ) + + register_sensitive_header('authorization') + register_sensitive_param('Signature') + register_sensitive_param('X-Amz-Signature') + + def s3api_filter(app): + return S3ApiMiddleware(ListingEtagMiddleware(app), conf) + + return s3api_filter diff --git a/swift/common/middleware/s3api/s3request.py b/swift/common/middleware/s3api/s3request.py new file mode 100644 index 0000000000..9f3641f067 --- /dev/null +++ b/swift/common/middleware/s3api/s3request.py @@ -0,0 +1,2465 @@ +# Copyright (c) 2014 OpenStack Foundation. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
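The check_filter_order helper above only verifies that the required filter names appear in the pipeline in the given relative order. A standalone sketch of the same idea, exercised against a hypothetical sample pipeline matching the module docstring's tempauth example:

    def check_filter_order(pipeline, required_filters):
        """Raise ValueError unless required_filters appear, in order."""
        try:
            indexes = [pipeline.index(name) for name in required_filters]
        except ValueError:
            raise ValueError('missing filters in %r' % (pipeline,))
        if indexes != sorted(indexes):
            raise ValueError('%r not in expected order %r'
                             % (pipeline, required_filters))

    pipeline = ['proxy-logging', 'cache', 's3api', 'tempauth',
                'bulk', 'slo', 'proxy-logging', 'proxy-server']
    check_filter_order(pipeline, ['s3api', 'proxy-server'])  # passes
    check_filter_order(pipeline, ['s3api', 'tempauth'])      # passes
    # check_filter_order(pipeline, ['tempauth', 's3api'])    # raises ValueError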
+ +import base64 +import binascii +from collections import defaultdict, OrderedDict +import contextlib +from email.header import Header +from hashlib import sha1, sha256 +import hmac +import re +# pylint: disable-msg=import-error +from urllib.parse import quote, unquote, parse_qsl +import string + +from swift.common.utils import split_path, json, md5, streq_const_time, \ + close_if_possible, InputProxy, get_policy_index, list_from_csv, \ + strict_b64decode, base64_str, checksum +from swift.common.registry import get_swift_info +from swift.common import swob +from swift.common.http import HTTP_OK, HTTP_CREATED, HTTP_ACCEPTED, \ + HTTP_NO_CONTENT, HTTP_UNAUTHORIZED, HTTP_FORBIDDEN, HTTP_NOT_FOUND, \ + HTTP_CONFLICT, HTTP_UNPROCESSABLE_ENTITY, HTTP_REQUEST_ENTITY_TOO_LARGE, \ + HTTP_PARTIAL_CONTENT, HTTP_NOT_MODIFIED, HTTP_PRECONDITION_FAILED, \ + HTTP_REQUESTED_RANGE_NOT_SATISFIABLE, HTTP_LENGTH_REQUIRED, \ + HTTP_BAD_REQUEST, HTTP_REQUEST_TIMEOUT, HTTP_SERVICE_UNAVAILABLE, \ + HTTP_TOO_MANY_REQUESTS, HTTP_RATE_LIMITED, is_success, \ + HTTP_CLIENT_CLOSED_REQUEST + +from swift.proxy.controllers.base import get_container_info +from swift.common.request_helpers import check_path_header + +from swift.common.middleware.s3api.controllers import ServiceController, \ + ObjectController, AclController, MultiObjectDeleteController, \ + LocationController, LoggingStatusController, PartController, \ + UploadController, UploadsController, VersioningController, \ + UnsupportedController, S3AclController, BucketController, \ + TaggingController, ObjectLockController +from swift.common.middleware.s3api.s3response import AccessDenied, \ + InvalidArgument, InvalidDigest, BucketAlreadyOwnedByYou, \ + RequestTimeTooSkewed, S3Response, SignatureDoesNotMatch, \ + BucketAlreadyExists, BucketNotEmpty, EntityTooLarge, \ + InternalError, NoSuchBucket, NoSuchKey, PreconditionFailed, InvalidRange, \ + MissingContentLength, InvalidStorageClass, S3NotImplemented, InvalidURI, \ + MalformedXML, InvalidRequest, RequestTimeout, InvalidBucketName, \ + BadDigest, AuthorizationHeaderMalformed, SlowDown, \ + AuthorizationQueryParametersError, ServiceUnavailable, BrokenMPU, \ + XAmzContentSHA256Mismatch, IncompleteBody, InvalidChunkSizeError, \ + InvalidPartNumber, InvalidPartArgument, MalformedTrailerError +from swift.common.middleware.s3api.exception import NotS3Request, \ + S3InputError, S3InputSizeError, S3InputIncomplete, \ + S3InputChunkSignatureMismatch, S3InputChunkTooSmall, \ + S3InputMalformedTrailer, S3InputMissingSecret, \ + S3InputSHA256Mismatch, S3InputChecksumMismatch, \ + S3InputChecksumTrailerInvalid +from swift.common.middleware.s3api.utils import utf8encode, \ + S3Timestamp, mktime, MULTIUPLOAD_SUFFIX +from swift.common.middleware.s3api.subresource import decode_acl, encode_acl +from swift.common.middleware.s3api.utils import sysmeta_header, \ + parse_host, parse_path, Config +from swift.common.middleware.s3api.exception import \ + InvalidBucketNameParseError, InvalidURIParseError +from swift.common.middleware.s3api.acl_utils import handle_acl_header + + +# List of sub-resources that must be maintained as part of the HMAC +# signature string. 
+ALLOWED_SUB_RESOURCES = sorted([ + 'acl', 'delete', 'lifecycle', 'location', 'logging', 'notification', + 'partNumber', 'policy', 'requestPayment', 'torrent', 'uploads', 'uploadId', + 'versionId', 'versioning', 'versions', 'website', + 'response-cache-control', 'response-content-disposition', + 'response-content-encoding', 'response-content-language', + 'response-content-type', 'response-expires', 'cors', 'tagging', 'restore', + 'object-lock' +]) + + +MAX_32BIT_INT = 2147483647 +SIGV2_TIMESTAMP_FORMAT = '%Y-%m-%dT%H:%M:%S' +SIGV4_X_AMZ_DATE_FORMAT = '%Y%m%dT%H%M%SZ' +SIGV4_CHUNK_MIN_SIZE = 8192 +SERVICE = 's3' # useful for mocking out in tests + + +CHECKSUMS_BY_HEADER = { + 'x-amz-checksum-crc32': checksum.crc32, + 'x-amz-checksum-crc32c': checksum.crc32c, + 'x-amz-checksum-crc64nvme': checksum.crc64nvme, + 'x-amz-checksum-sha1': sha1, + 'x-amz-checksum-sha256': sha256, +} + + +def _get_checksum_hasher(header): + try: + return CHECKSUMS_BY_HEADER[header]() + except (KeyError, NotImplementedError): + raise S3NotImplemented('The %s algorithm is not supported.' % header) + + +def _validate_checksum_value(checksum_hasher, b64digest): + return strict_b64decode( + b64digest, + exact_size=checksum_hasher.digest_size, + ) + + +def _validate_checksum_header_cardinality(num_checksum_headers, + headers_and_trailer=False): + if num_checksum_headers > 1: + # inconsistent messaging for AWS compatibility... + msg = 'Expecting a single x-amz-checksum- header' + if not headers_and_trailer: + msg += '. Multiple checksum Types are not allowed.' + raise InvalidRequest(msg) + + +def _is_streaming(aws_sha256): + return aws_sha256 in ( + 'STREAMING-UNSIGNED-PAYLOAD-TRAILER', + 'STREAMING-AWS4-HMAC-SHA256-PAYLOAD', + 'STREAMING-AWS4-HMAC-SHA256-PAYLOAD-TRAILER', + 'STREAMING-AWS4-ECDSA-P256-SHA256-PAYLOAD', + 'STREAMING-AWS4-ECDSA-P256-SHA256-PAYLOAD-TRAILER', + ) + + +def _header_strip(value): + # S3 seems to strip *all* control characters + if value is None: + return None + stripped = _header_strip.re.sub('', value) + if value and not stripped: + # If there's nothing left after stripping, + # behave as though it wasn't provided + return None + return stripped + + +_header_strip.re = re.compile('^[\x00-\x20]*|[\x00-\x20]*$') + + +def _header_acl_property(resource): + """ + Set and retrieve the acl in self.headers + """ + + def getter(self): + return getattr(self, '_%s' % resource) + + def setter(self, value): + self.headers.update(encode_acl(resource, value)) + setattr(self, '_%s' % resource, value) + + def deleter(self): + self.headers[sysmeta_header(resource, 'acl')] = '' + + return property(getter, setter, deleter, + doc='Get and set the %s acl property' % resource) + + +def _parse_path(req, bucket_in_host, dns_compliant_bucket_names): + try: + return parse_path(req, bucket_in_host, dns_compliant_bucket_names) + except InvalidURIParseError as err: + raise InvalidURI(err.uri) + except InvalidBucketNameParseError as err: + raise InvalidBucketName(err.bucket_name) + + +class HashingInput(InputProxy): + """ + wsgi.input wrapper to verify the SHA256 of the input as it's read. 
+ """ + + def __init__(self, wsgi_input, content_length, expected_hex_hash): + super().__init__(wsgi_input) + self._expected_length = content_length + self._hasher = sha256() + self._expected_hash = expected_hex_hash + if content_length == 0 and \ + self._hasher.hexdigest() != self._expected_hash.lower(): + self.close() + raise XAmzContentSHA256Mismatch( + client_computed_content_s_h_a256=self._expected_hash, + s3_computed_content_s_h_a256=self._hasher.hexdigest(), + ) + + def chunk_update(self, chunk, eof, *args, **kwargs): + # Note that "chunk" is just whatever was read from the input; this + # says nothing about whether the underlying stream uses aws-chunked + self._hasher.update(chunk) + + if self.bytes_received < self._expected_length: + error = eof + elif self.bytes_received == self._expected_length: + error = self._hasher.hexdigest() != self._expected_hash.lower() + else: + error = True + + if error: + self.close() + # Since we don't return the last chunk, the PUT never completes + raise S3InputSHA256Mismatch( + self._expected_hash, + self._hasher.hexdigest()) + + return chunk + + +class ChecksummingInput(InputProxy): + """ + wsgi.input wrapper to calculate the X-Amz-Checksum-* of the input as it's + read. The calculated value is checked against an expected value that is + sent in either the request headers or trailers. To allow for the latter, + the expected value is lazy fetched once the input has been read. + + :param wsgi_input: file-like object to be wrapped. + :param content_length: the expected number of bytes to be read. + :param checksum_hasher: a hasher to calculate the checksum of read bytes. + :param checksum_key: the name of the header or trailer that will have + the expected checksum value to be checked. + :param checksum_source: a dict that will have the ``checksum_key``. + """ + + def __init__(self, wsgi_input, content_length, checksum_hasher, + checksum_key, checksum_source): + super().__init__(wsgi_input) + self._expected_length = content_length + self._checksum_hasher = checksum_hasher + self._checksum_key = checksum_key + self._checksum_source = checksum_source + + def chunk_update(self, chunk, eof, *args, **kwargs): + # Note that "chunk" is just whatever was read from the input; this + # says nothing about whether the underlying stream uses aws-chunked + self._checksum_hasher.update(chunk) + if self.bytes_received < self._expected_length: + # wrapped input is likely to have timed out before this clause is + # reached with eof==True, but just in case... + error = eof + elif self.bytes_received == self._expected_length: + # Lazy fetch checksum value because it may have come in trailers + b64digest = self._checksum_source.get(self._checksum_key) + try: + expected_raw_checksum = _validate_checksum_value( + self._checksum_hasher, b64digest) + except ValueError: + # If the checksum value came in a header then it would have + # been validated before the body was read, so if the validation + # fails here then we can infer that the checksum value came in + # a trailer. The S3InputChecksumTrailerInvalid raised here will + # propagate all the way back up the middleware stack to s3api + # where it is caught and translated to an InvalidRequest. + raise S3InputChecksumTrailerInvalid(self._checksum_key) + error = self._checksum_hasher.digest() != expected_raw_checksum + else: + # the underlying wsgi.Input stops reading at content-length so we + # don't expect to reach this clause, but just in case... 
+ error = True + + if error: + self.close() + # Since we don't return the last chunk, the PUT never completes + raise S3InputChecksumMismatch(self._checksum_hasher.name.upper()) + return chunk + + +class ChunkReader(InputProxy): + """ + wsgi.input wrapper to read a single chunk from an aws-chunked input and + validate its signature. + + :param wsgi_input: a wsgi input. + :param chunk_size: number of bytes to read. + :param validator: function to call to validate the chunk's content. + :param chunk_params: string of params from the chunk's header. + """ + def __init__(self, wsgi_input, chunk_size, validator, chunk_params): + super().__init__(wsgi_input) + self.chunk_size = chunk_size + self._validator = validator + if self._validator is None: + self._signature = None + else: + self._signature = self._parse_chunk_signature(chunk_params) + self._sha256 = sha256() + + def _parse_chunk_signature(self, chunk_params): + if not chunk_params: + raise S3InputIncomplete + start, _, chunk_sig = chunk_params.partition('=') + if start.strip() != 'chunk-signature': + # Call the validator to update the string to sign + self._validator('', '') + raise S3InputChunkSignatureMismatch + if ';' in chunk_sig: + raise S3InputIncomplete + chunk_sig = chunk_sig.strip() + if not chunk_sig: + raise S3InputIncomplete + return chunk_sig + + @property + def to_read(self): + return self.chunk_size - self.bytes_received + + def read(self, size=None, *args, **kwargs): + if size is None or size < 0 or size > self.to_read: + size = self.to_read + return super().read(size) + + def readline(self, size=None, *args, **kwargs): + if size is None or size < 0 or size > self.to_read: + size = self.to_read + return super().readline(size) + + def chunk_update(self, chunk, eof, *args, **kwargs): + # Note that "chunk" is just whatever was read from the input + self._sha256.update(chunk) + if self.bytes_received == self.chunk_size: + if self._validator and not self._validator( + self._sha256.hexdigest(), self._signature): + self.close() + raise S3InputChunkSignatureMismatch + return chunk + + +class StreamingInput: + """ + wsgi.input wrapper to read a chunked input, verifying each chunk as it's + read. Once all chunks have been read, any trailers are read. + + :param input: a wsgi input. + :param decoded_content_length: the number of payload bytes expected to be + extracted from chunks. + :param expected_trailers: the set of trailer names expected. + :param sig_checker: an instance of SigCheckerV4 that will be called to + verify each chunk's signature. + """ + def __init__(self, input, decoded_content_length, + expected_trailers, sig_checker): + self._input = input + self._decoded_content_length = decoded_content_length + self._expected_trailers = expected_trailers + self._sig_checker = sig_checker + # Length of the payload remaining; i.e., number of bytes a caller + # still expects to be able to read. Once exhausted, we should be + # exactly at the trailers (if present) + self._to_read = decoded_content_length + # Reader for the current chunk that's in progress + self._chunk_reader = None + # Track the chunk number, for error messages + self._chunk_number = 0 + # Track the size of the most recently read chunk. 
AWS enforces an 8k + # min chunk size (except the final chunk) + self._last_chunk_size = None + # When True, we've read the payload, but not necessarily the trailers + self._completed_payload = False + # When True, we've read the trailers + self._completed_trailers = False + # Any trailers present after the payload (not available until after + # caller has read full payload; i.e., until after _to_read is 0) + self.trailers = {} + + def _read_chunk_header(self): + """ + Read a chunk header, reading at most one line from the raw input. + + Parse out the next chunk size and any other params. + + :returns: a tuple of (chunk_size, chunk_params). chunk_size is an int, + chunk_params is string. + """ + self._chunk_number += 1 + chunk_header = swob.bytes_to_wsgi(self._input.readline()) + if chunk_header[-2:] != '\r\n': + raise S3InputIncomplete('invalid chunk header: %s' % chunk_header) + chunk_size, _, chunk_params = chunk_header[:-2].partition(';') + + try: + chunk_size = int(chunk_size, 16) + if chunk_size < 0: + raise ValueError + except ValueError: + raise S3InputIncomplete('invalid chunk header: %s' % chunk_header) + + if self._last_chunk_size is not None and \ + self._last_chunk_size < SIGV4_CHUNK_MIN_SIZE and \ + chunk_size != 0: + raise S3InputChunkTooSmall(self._last_chunk_size, + self._chunk_number) + self._last_chunk_size = chunk_size + + if chunk_size > self._to_read: + raise S3InputSizeError( + self._decoded_content_length, + self._decoded_content_length - self._to_read + chunk_size) + return chunk_size, chunk_params + + def _read_payload(self, size, readline=False): + bufs = [] + bytes_read = 0 + while not self._completed_payload and ( + bytes_read < size + # Make sure we read the trailing zero-byte chunk at the end + or self._to_read == 0): + if self._chunk_reader is None: + # OK, we're at the start of a new chunk + chunk_size, chunk_params = self._read_chunk_header() + self._chunk_reader = ChunkReader( + self._input, + chunk_size, + self._sig_checker and + self._sig_checker.check_chunk_signature, + chunk_params) + if readline: + buf = self._chunk_reader.readline(size - bytes_read) + else: + buf = self._chunk_reader.read(size - bytes_read) + bufs.append(buf) + if self._chunk_reader.to_read == 0: + # If it's the final chunk, we're in (possibly empty) trailers + # Otherwise, there's a CRLF chunk-separator + if self._chunk_reader.chunk_size == 0: + self._completed_payload = True + elif self._input.read(2) != b'\r\n': + raise S3InputIncomplete + self._chunk_reader = None + bytes_read += len(buf) + self._to_read -= len(buf) + if readline and buf[-1:] == b'\n': + break + return b''.join(bufs) + + def _read_trailers(self): + if self._expected_trailers: + for line in iter(self._input.readline, b''): + if not line.endswith(b'\r\n'): + raise S3InputIncomplete + if line == b'\r\n': + break + key, _, value = swob.bytes_to_wsgi(line).partition(':') + if key.lower() not in self._expected_trailers: + raise S3InputMalformedTrailer + self.trailers[key.strip()] = value.strip() + if 'x-amz-trailer-signature' in self._expected_trailers \ + and 'x-amz-trailer-signature' not in self.trailers: + raise S3InputIncomplete + if set(self.trailers.keys()) != self._expected_trailers: + raise S3InputMalformedTrailer + if 'x-amz-trailer-signature' in self._expected_trailers \ + and self._sig_checker is not None: + if not self._sig_checker.check_trailer_signature( + self.trailers): + raise S3InputChunkSignatureMismatch + if len(self.trailers) == 1: + raise S3InputIncomplete + # Now that we've read them, we expect 
no more + self._expected_trailers = set() + elif self._input.read(2) not in (b'', b'\r\n'): + raise S3InputIncomplete + + self._completed_trailers = True + + def _read(self, size, readline=False): + data = self._read_payload(size, readline) + if self._completed_payload: + if not self._completed_trailers: + # read trailers, if present + self._read_trailers() + # At this point, we should have read everything; if we haven't, + # that's an error + if self._to_read: + raise S3InputSizeError( + self._decoded_content_length, + self._decoded_content_length - self._to_read) + return data + + def read(self, size=None): + if size is None or size < 0 or size > self._to_read: + size = self._to_read + try: + return self._read(size) + except S3InputError: + self.close() + raise + + def readline(self, size=None): + if size is None or size < 0 or size > self._to_read: + size = self._to_read + try: + return self._read(size, True) + except S3InputError: + self.close() + raise + + def close(self): + close_if_possible(self._input) + + +class BaseSigChecker: + def __init__(self, req): + self.req = req + self.signature = req.signature + self.string_to_sign = self._string_to_sign() + self._secret = None + + def _string_to_sign(self): + raise NotImplementedError + + def _derive_secret(self, secret): + return utf8encode(secret) + + def _check_signature(self): + raise NotImplementedError + + def check_signature(self, secret): + self._secret = self._derive_secret(secret) + return self._check_signature() + + +class SigCheckerV2(BaseSigChecker): + def _string_to_sign(self): + """ + Create 'StringToSign' value in Amazon terminology for v2. + """ + buf = [swob.wsgi_to_bytes(wsgi_str) for wsgi_str in [ + self.req.method, + _header_strip(self.req.headers.get('Content-MD5')) or '', + _header_strip(self.req.headers.get('Content-Type')) or '']] + + if 'headers_raw' in self.req.environ: # eventlet >= 0.19.0 + # See https://github.com/eventlet/eventlet/commit/67ec999 + amz_headers = defaultdict(list) + for key, value in self.req.environ['headers_raw']: + key = key.lower() + if not key.startswith('x-amz-'): + continue + amz_headers[key.strip()].append(value.strip()) + amz_headers = dict((key, ','.join(value)) + for key, value in amz_headers.items()) + else: # mostly-functional fallback + amz_headers = dict((key.lower(), value) + for key, value in self.req.headers.items() + if key.lower().startswith('x-amz-')) + + if self.req._is_header_auth: + if 'x-amz-date' in amz_headers: + buf.append(b'') + elif 'Date' in self.req.headers: + buf.append(swob.wsgi_to_bytes(self.req.headers['Date'])) + elif self.req._is_query_auth: + buf.append(swob.wsgi_to_bytes(self.req.params['Expires'])) + else: + # Should have already raised NotS3Request in _parse_auth_info, + # but as a sanity check... + raise AccessDenied(reason='not_s3') + + for key, value in sorted(amz_headers.items()): + buf.append(swob.wsgi_to_bytes("%s:%s" % (key, value))) + + path = self.req._canonical_uri() + if self.req.query_string: + path += '?' + self.req.query_string + params = [] + if '?' 
in path: + path, args = path.split('?', 1) + for key, value in sorted(self.req.params.items()): + if key in ALLOWED_SUB_RESOURCES: + params.append('%s=%s' % (key, value) if value else key) + if params: + buf.append(swob.wsgi_to_bytes('%s?%s' % (path, '&'.join(params)))) + else: + buf.append(swob.wsgi_to_bytes(path)) + return b'\n'.join(buf) + + def _check_signature(self): + valid_signature = base64_str( + hmac.new(self._secret, self.string_to_sign, sha1).digest()) + return streq_const_time(self.signature, valid_signature) + + +class SigCheckerV4(BaseSigChecker): + def __init__(self, req): + super().__init__(req) + self._all_chunk_signatures_valid = True + + def _string_to_sign(self): + return b'\n'.join([ + b'AWS4-HMAC-SHA256', + self.req.timestamp.amz_date_format.encode('ascii'), + '/'.join(self.req.scope.values()).encode('utf8'), + sha256(self.req._canonical_request()).hexdigest().encode('ascii')]) + + def _derive_secret(self, secret): + derived_secret = b'AWS4' + super()._derive_secret(secret) + for scope_piece in self.req.scope.values(): + derived_secret = hmac.new( + derived_secret, scope_piece.encode('utf8'), sha256).digest() + return derived_secret + + def _check_signature(self): + if self._secret is None: + raise S3InputMissingSecret + valid_signature = hmac.new( + self._secret, self.string_to_sign, sha256).hexdigest() + return streq_const_time(self.signature, valid_signature) + + def _chunk_string_to_sign(self, data_sha256): + """ + Create 'ChunkStringToSign' value in Amazon terminology for v4. + """ + return b'\n'.join([ + b'AWS4-HMAC-SHA256-PAYLOAD', + self.req.timestamp.amz_date_format.encode('ascii'), + '/'.join(self.req.scope.values()).encode('utf8'), + self.signature.encode('utf8'), + sha256(b'').hexdigest().encode('utf8'), + data_sha256.encode('utf8') + ]) + + def check_chunk_signature(self, chunk_sha256, signature): + """ + Check the validity of a chunk's signature. + + This method verifies the signature of a given chunk using its SHA-256 + hash. It updates the string to sign and the current signature, then + checks if the signature is valid. If any chunk signature is invalid, + it returns False. + + :param chunk_sha256: (str) The SHA-256 hash of the chunk. + :param signature: (str) The signature to be verified. + :returns: True if all chunk signatures are valid, False otherwise. + """ + if not self._all_chunk_signatures_valid: + return False + # NB: string_to_sign is calculated using the previous signature + self.string_to_sign = self._chunk_string_to_sign(chunk_sha256) + # So we have to update the signature to compare against *after* + # the string-to-sign + self.signature = signature + self._all_chunk_signatures_valid &= self._check_signature() + return self._all_chunk_signatures_valid + + def _trailer_string_to_sign(self, trailers): + """ + Create 'TrailerChunkStringToSign' value in Amazon terminology for v4. + """ + canonical_trailers = swob.wsgi_to_bytes(''.join( + f'{key}:{value}\n' + for key, value in sorted( + trailers.items(), + key=lambda kvp: swob.wsgi_to_bytes(kvp[0]).lower(), + ) + if key != 'x-amz-trailer-signature' + )) + if not canonical_trailers: + canonical_trailers = b'\n' + return b'\n'.join([ + b'AWS4-HMAC-SHA256-TRAILER', + self.req.timestamp.amz_date_format.encode('ascii'), + '/'.join(self.req.scope.values()).encode('utf8'), + self.signature.encode('utf8'), + sha256(canonical_trailers).hexdigest().encode('utf8'), + ]) + + def check_trailer_signature(self, trailers): + """ + Check the validity of a chunk's signature. 
+ + This method verifies the trailers received after the main payload. + + :param trailers: (dict[str, str]) The trailers received. + :returns: True if x-amz-trailer-signature is valid, False otherwise. + """ + if not self._all_chunk_signatures_valid: + # if there was a breakdown earlier, this can't be right + return False + # NB: string_to_sign is calculated using the previous signature + self.string_to_sign = self._trailer_string_to_sign(trailers) + # So we have to update the signature to compare against *after* + # the string-to-sign + self.signature = trailers['x-amz-trailer-signature'] + self._all_chunk_signatures_valid &= self._check_signature() + return self._all_chunk_signatures_valid + + +def _parse_credential(credential_string): + """ + Parse an AWS credential string into its components. + + This method splits the given credential string into its constituent parts: + access key ID, date, AWS region, AWS service, and terminal identifier. + The credential string must follow the format: + ////aws4_request. + + :param credential_string: (str) The AWS credential string to be parsed. + :raises AccessDenied: If the credential string is invalid or does not + follow the required format. + :returns: A dict containing the parsed components of the credential string. + """ + parts = credential_string.split("/") + # credential must be in following format: + # ////aws4_request + if not parts[0] or len(parts) != 5: + raise AccessDenied(reason='invalid_credential') + return dict(zip(['access', 'date', 'region', 'service', 'terminal'], + parts)) + + +class SigV4Mixin(object): + """ + A request class mixin to provide S3 signature v4 functionality + """ + + @property + def _is_query_auth(self): + return 'X-Amz-Credential' in self.params + + @property + def _is_x_amz_content_sha256_required(self): + return not self._is_query_auth + + @property + def timestamp(self): + """ + Return timestamp string according to the auth type + The difference from v2 is v4 have to see 'X-Amz-Date' even though + it's query auth type. 
+ """ + if not self._timestamp: + try: + if self._is_query_auth and 'X-Amz-Date' in self.params: + # NOTE(andrey-mp): Date in Signature V4 has different + # format + timestamp = mktime( + self.params['X-Amz-Date'], SIGV4_X_AMZ_DATE_FORMAT) + else: + if self.headers.get('X-Amz-Date'): + timestamp = mktime( + self.headers.get('X-Amz-Date'), + SIGV4_X_AMZ_DATE_FORMAT) + else: + timestamp = mktime(self.headers.get('Date')) + except (ValueError, TypeError): + raise AccessDenied('AWS authentication requires a valid Date ' + 'or x-amz-date header', + reason='invalid_date') + + if timestamp < 0: + raise AccessDenied('AWS authentication requires a valid Date ' + 'or x-amz-date header', + reason='invalid_date') + + try: + self._timestamp = S3Timestamp(timestamp) + except ValueError: + # Must be far-future; blame clock skew + raise RequestTimeTooSkewed() + + return self._timestamp + + def _validate_expire_param(self): + """ + Validate X-Amz-Expires in query parameter + :raises: AccessDenied + :raises: AuthorizationQueryParametersError + :raises: AccessDenined + """ + err = None + try: + expires = int(self.params['X-Amz-Expires']) + except KeyError: + raise AccessDenied(reason='invalid_expires') + except ValueError: + err = 'X-Amz-Expires should be a number' + else: + if expires < 0: + err = 'X-Amz-Expires must be non-negative' + elif expires >= 2 ** 63: + err = 'X-Amz-Expires should be a number' + elif expires > 604800: + err = ('X-Amz-Expires must be less than a week (in seconds); ' + 'that is, the given X-Amz-Expires must be less than ' + '604800 seconds') + if err: + raise AuthorizationQueryParametersError(err) + + if int(self.timestamp) + expires < S3Timestamp.now(): + raise AccessDenied('Request has expired', reason='expired') + + def _parse_query_authentication(self): + """ + Parse v4 query authentication + - version 4: + 'X-Amz-Credential' and 'X-Amz-Signature' should be in param + :raises: AccessDenied + :raises: AuthorizationHeaderMalformed + """ + if self.params.get('X-Amz-Algorithm') != 'AWS4-HMAC-SHA256': + raise InvalidArgument('X-Amz-Algorithm', + self.params.get('X-Amz-Algorithm')) + try: + cred_param = _parse_credential( + swob.wsgi_to_str(self.params['X-Amz-Credential'])) + sig = swob.wsgi_to_str(self.params['X-Amz-Signature']) + if not sig: + raise AccessDenied(reason='invalid_query_auth') + except KeyError: + raise AccessDenied(reason='invalid_query_auth') + + try: + signed_headers = swob.wsgi_to_str( + self.params['X-Amz-SignedHeaders']) + except KeyError: + # TODO: make sure if is it malformed request? + raise AuthorizationHeaderMalformed() + + self._signed_headers = set(signed_headers.split(';')) + + invalid_messages = { + 'date': 'Invalid credential date "%s". This date is not the same ' + 'as X-Amz-Date: "%s".', + 'region': "Error parsing the X-Amz-Credential parameter; " + "the region '%s' is wrong; expecting '%s'", + 'service': 'Error parsing the X-Amz-Credential parameter; ' + 'incorrect service "%s". This endpoint belongs to "%s".', + 'terminal': 'Error parsing the X-Amz-Credential parameter; ' + 'incorrect terminal "%s". 
This endpoint uses "%s".', + } + for key in ('date', 'region', 'service', 'terminal'): + if cred_param[key] != self.scope[key]: + kwargs = {} + if key == 'region': + # Allow lowercase region name + # for AWS .NET SDK compatibility + if not self.scope[key].islower() and \ + cred_param[key] == self.scope[key].lower(): + self.location = self.location.lower() + continue + kwargs = {'region': self.scope['region']} + raise AuthorizationQueryParametersError( + invalid_messages[key] % (cred_param[key], self.scope[key]), + **kwargs) + + return cred_param['access'], sig + + def _parse_header_authentication(self): + """ + Parse v4 header authentication + - version 4: + 'X-Amz-Credential' and 'X-Amz-Signature' should be in param + :raises: AccessDenied + :raises: AuthorizationHeaderMalformed + """ + + auth_str = swob.wsgi_to_str(self.headers['Authorization']) + cred_param = _parse_credential(auth_str.partition( + "Credential=")[2].split(',')[0]) + sig = auth_str.partition("Signature=")[2].split(',')[0] + if not sig: + raise AccessDenied(reason='invalid_header_auth') + signed_headers = auth_str.partition( + "SignedHeaders=")[2].split(',', 1)[0] + if not signed_headers: + # TODO: make sure if is it Malformed? + raise AuthorizationHeaderMalformed() + + invalid_messages = { + 'date': 'Invalid credential date "%s". This date is not the same ' + 'as X-Amz-Date: "%s".', + 'region': "The authorization header is malformed; the region '%s' " + "is wrong; expecting '%s'", + 'service': 'The authorization header is malformed; incorrect ' + 'service "%s". This endpoint belongs to "%s".', + 'terminal': 'The authorization header is malformed; incorrect ' + 'terminal "%s". This endpoint uses "%s".', + } + for key in ('date', 'region', 'service', 'terminal'): + if cred_param[key] != self.scope[key]: + kwargs = {} + if key == 'region': + # Allow lowercase region name + # for AWS .NET SDK compatibility + if not self.scope[key].islower() and \ + cred_param[key] == self.scope[key].lower(): + self.location = self.location.lower() + continue + kwargs = {'region': self.scope['region']} + raise AuthorizationHeaderMalformed( + invalid_messages[key] % (cred_param[key], self.scope[key]), + **kwargs) + + self._signed_headers = set(signed_headers.split(';')) + + return cred_param['access'], sig + + def _canonical_query_string(self): + return '&'.join( + '%s=%s' % (swob.wsgi_quote(key, safe='-_.~'), + swob.wsgi_quote(value, safe='-_.~')) + for key, value in sorted(self.params.items()) + if key not in ('Signature', 'X-Amz-Signature')).encode('ascii') + + def _headers_to_sign(self): + """ + Select the headers from the request that need to be included + in the StringToSign. 
+ + :return : dict of headers to sign, the keys are all lower case + """ + if 'headers_raw' in self.environ: # eventlet >= 0.19.0 + # See https://github.com/eventlet/eventlet/commit/67ec999 + headers_lower_dict = defaultdict(list) + for key, value in self.environ['headers_raw']: + headers_lower_dict[key.lower().strip()].append( + ' '.join(_header_strip(value or '').split())) + headers_lower_dict = {k: ','.join(v) + for k, v in headers_lower_dict.items()} + else: # mostly-functional fallback + headers_lower_dict = dict( + (k.lower().strip(), ' '.join(_header_strip(v or '').split())) + for (k, v) in self.headers.items()) + + if 'host' in headers_lower_dict and re.match( + 'Boto/2.[0-9].[0-2]', + headers_lower_dict.get('user-agent', '')): + # Boto versions < 2.9.3 strip the port component of the host:port + # header, so detect the user-agent via the header and strip the + # port if we detect an old boto version. + headers_lower_dict['host'] = \ + headers_lower_dict['host'].split(':')[0] + + headers_to_sign = [ + (key, value) for key, value in sorted(headers_lower_dict.items()) + if swob.wsgi_to_str(key) in self._signed_headers] + + if len(headers_to_sign) != len(self._signed_headers): + # NOTE: if we are missing the header suggested via + # signed_header in actual header, it results in + # SignatureDoesNotMatch in actual S3 so we can raise + # the error immediately here to save redundant check + # process. + raise SignatureDoesNotMatch() + + return headers_to_sign + + def _canonical_uri(self): + """ + It won't require bucket name in canonical_uri for v4. + """ + return swob.wsgi_to_bytes(swob.wsgi_quote( + self.environ.get('PATH_INFO', self.path), safe='-_.~/')) + + def _canonical_request(self): + # prepare 'canonical_request' + # Example requests are like following: + # + # GET + # / + # Action=ListUsers&Version=2010-05-08 + # content-type:application/x-www-form-urlencoded; charset=utf-8 + # host:iam.amazonaws.com + # x-amz-date:20150830T123600Z + # + # content-type;host;x-amz-date + # e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855 + # + + # 1. Add verb like: GET + cr = [swob.wsgi_to_bytes(self.method)] + + # 2. Add path like: / + path = self._canonical_uri() + cr.append(path) + + # 3. Add query like: Action=ListUsers&Version=2010-05-08 + cr.append(self._canonical_query_string()) + + # 4. Add headers like: + # content-type:application/x-www-form-urlencoded; charset=utf-8 + # host:iam.amazonaws.com + # x-amz-date:20150830T123600Z + headers_to_sign = self._headers_to_sign() + cr.append(b''.join(swob.wsgi_to_bytes('%s:%s\n' % (key, value)) + for key, value in headers_to_sign)) + + # 5. Add signed headers into canonical request like + # content-type;host;x-amz-date + cr.append(b';'.join(swob.wsgi_to_bytes(k) for k, v in headers_to_sign)) + + # 6. 
Add payload string at the tail + hashed_payload = self.headers.get('X-Amz-Content-SHA256', + 'UNSIGNED-PAYLOAD') + + cr.append(swob.wsgi_to_bytes(hashed_payload)) + return b'\n'.join(cr) + + @property + def scope(self): + return OrderedDict([ + ('date', self.timestamp.amz_date_format.split('T')[0]), + ('region', self.location), + ('service', SERVICE), + ('terminal', 'aws4_request'), + ]) + + def signature_does_not_match_kwargs(self): + kwargs = super(SigV4Mixin, self).signature_does_not_match_kwargs() + cr = self._canonical_request() + kwargs.update({ + 'canonical_request': cr, + 'canonical_request_bytes': ' '.join( + format(b, '02x') for b in cr), + }) + return kwargs + + +def get_request_class(env, s3_acl): + """ + Helper function to find a request class to use from Map + """ + if s3_acl: + request_classes = (S3AclRequest, SigV4S3AclRequest) + else: + request_classes = (S3Request, SigV4Request) + + req = swob.Request(env) + if 'X-Amz-Credential' in req.params or \ + req.headers.get('Authorization', '').startswith( + 'AWS4-HMAC-SHA256 '): + # This is an Amazon SigV4 request + return request_classes[1] + else: + # The others using Amazon SigV2 class + return request_classes[0] + + +class S3Request(swob.Request): + """ + S3 request object. + """ + + bucket_acl = _header_acl_property('container') + object_acl = _header_acl_property('object') + + def __init__(self, env, app=None, conf=None): + # NOTE: app is not used by this class, need for compatibility of S3acl + swob.Request.__init__(self, env) + self.conf = conf or Config() + self.location = self.conf.location + self._timestamp = None + self.access_key, self.signature = self._parse_auth_info() + self.bucket_in_host = parse_host(self.environ, + self.conf.storage_domains) + self.container_name, self.object_name = _parse_path( + self, self.bucket_in_host, self.conf.dns_compliant_bucket_names) + self._validate_headers() + if isinstance(self, SigV4Mixin): + # this is a deliberate but only partial shift away from the + # 'inherit and override from mixin' pattern towards a 'compose + # adapters' pattern. + self.sig_checker = SigCheckerV4(self) + else: + self.sig_checker = SigCheckerV2(self) + aws_sha256 = self.headers.get('x-amz-content-sha256') + if self.method in ('PUT', 'POST'): + checksum_hasher, checksum_header, checksum_trailer = \ + self._validate_checksum_headers() + if _is_streaming(aws_sha256): + if checksum_trailer: + streaming_input = self._install_streaming_input_wrapper( + aws_sha256, checksum_trailer=checksum_trailer) + checksum_key = checksum_trailer + checksum_source = streaming_input.trailers + else: + self._install_streaming_input_wrapper(aws_sha256) + checksum_key = checksum_header + checksum_source = self.headers + elif checksum_trailer: + raise MalformedTrailerError + else: + self._install_non_streaming_input_wrapper(aws_sha256) + checksum_key = checksum_header + checksum_source = self.headers + + if self.method == 'PUT': + verify_checksum = True + elif self.method == 'POST': + if 'delete' in self.params: + verify_checksum = True + else: + # S3 doesn't check the checksum for some POSTs (e.g. 
MPU + # complete) + verify_checksum = False + else: + verify_checksum = False + + if checksum_key and verify_checksum: + self._install_checksumming_input_wrapper( + checksum_hasher, checksum_key, checksum_source) + + # Lock in string-to-sign now, before we start messing with query params + self.environ['s3api.auth_details'] = { + 'access_key': self.access_key, + 'signature': self.signature, + 'string_to_sign': self.sig_checker.string_to_sign, + 'check_signature': self.sig_checker.check_signature, + } + # Set the logging field (if not set already) + # Because auth mw to our right will only see a copy of the SwiftRequest + # environ we use a mutable value to back-propagate updates to proxy-log + access_key_value = (self.access_key[:125] + '...' + if len(self.access_key) > 128 + else self.access_key) + self.environ.setdefault('swift.access_logging', {}).setdefault( + 'user_id', access_key_value) + self.account = None + self.user_id = None + self.policy_index = None + + # Avoids that swift.swob.Response replaces Location header value + # by full URL when absolute path given. See swift.swob for more detail. + self.environ['swift.leave_relative_location'] = True + + def validate_part_number(self, parts_count=None, check_max=True): + """ + Get the partNumber param, if it exists, and check it is valid. + + To be valid, a partNumber must satisfy two criteria. First, it must be + an integer between 1 and the maximum allowed parts, inclusive. The + maximum allowed parts is the maximum of the configured + ``max_upload_part_num`` and, if given, ``parts_count``. Second, the + partNumber must be less than or equal to the ``parts_count``, if it is + given. + + :param parts_count: if given, this is the number of parts in an + existing object. + :raises InvalidPartArgument: if the partNumber param is invalid i.e. + less than 1 or greater than the maximum allowed parts. + :raises InvalidPartNumber: if the partNumber param is valid but greater + than ``num_parts``. + :return: an integer part number if the partNumber param exists, + otherwise ``None``. + """ + part_number = self.params.get('partNumber') + if part_number is None: + return None + + if self.range: + raise InvalidRequest('Cannot specify both Range header and ' + 'partNumber query parameter') + + try: + parts_count = int(parts_count) + except (TypeError, ValueError): + # an invalid/empty param is treated like parts_count=max_parts + parts_count = self.conf.max_upload_part_num + # max_parts may be raised to the number of existing parts + max_parts = max(self.conf.max_upload_part_num, parts_count) + + try: + part_number = int(part_number) + if part_number < 1: + raise ValueError + except ValueError: + raise InvalidPartArgument(max_parts, part_number) # 400 + + if check_max: + if part_number > max_parts: + raise InvalidPartArgument(max_parts, part_number) # 400 + if part_number > parts_count: + raise InvalidPartNumber() # 416 + + return part_number + + @property + def timestamp(self): + """ + S3Timestamp from Date header. If X-Amz-Date header specified, it + will be prior to Date header. + + :return : S3Timestamp instance + """ + if not self._timestamp: + try: + if self._is_query_auth and 'Timestamp' in self.params: + # If Timestamp specified in query, it should be prior + # to any Date header (is this right?) 
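                    # In other words, the precedence here is: a query
                    # 'Timestamp' parameter wins, then the 'X-Amz-Date'
                    # header, then the 'Date' header (see the else branch
                    # below).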
+ timestamp = mktime( + self.params['Timestamp'], SIGV2_TIMESTAMP_FORMAT) + else: + timestamp = mktime( + self.headers.get('X-Amz-Date', + self.headers.get('Date'))) + except ValueError: + raise AccessDenied('AWS authentication requires a valid Date ' + 'or x-amz-date header', + reason='invalid_date') + + if timestamp < 0: + raise AccessDenied('AWS authentication requires a valid Date ' + 'or x-amz-date header', + reason='invalid_date') + try: + self._timestamp = S3Timestamp(timestamp) + except ValueError: + # Must be far-future; blame clock skew + raise RequestTimeTooSkewed() + + return self._timestamp + + @property + def _is_header_auth(self): + return 'Authorization' in self.headers + + @property + def _is_query_auth(self): + return 'AWSAccessKeyId' in self.params + + @property + def _is_x_amz_content_sha256_required(self): + return False + + def _parse_query_authentication(self): + """ + Parse v2 authentication query args + TODO: make sure if 0, 1, 3 is supported? + - version 0, 1, 2, 3: + 'AWSAccessKeyId' and 'Signature' should be in param + + :return: a tuple of access_key and signature + :raises: AccessDenied + """ + try: + access = swob.wsgi_to_str(self.params['AWSAccessKeyId']) + expires = swob.wsgi_to_str(self.params['Expires']) + sig = swob.wsgi_to_str(self.params['Signature']) + except KeyError: + raise AccessDenied(reason='invalid_query_auth') + + if not all([access, sig, expires]): + raise AccessDenied(reason='invalid_query_auth') + + return access, sig + + def _parse_header_authentication(self): + """ + Parse v2 header authentication info + + :returns: a tuple of access_key and signature + :raises: AccessDenied + """ + auth_str = swob.wsgi_to_str(self.headers['Authorization']) + if not auth_str.startswith('AWS ') or ':' not in auth_str: + raise AccessDenied(reason='invalid_header_auth') + # This means signature format V2 + access, sig = auth_str.split(' ', 1)[1].rsplit(':', 1) + return access, sig + + def _parse_auth_info(self): + """Extract the access key identifier and signature. 
+ + :returns: a tuple of access_key and signature + :raises: NotS3Request + """ + if self._is_query_auth: + self._validate_expire_param() + return self._parse_query_authentication() + elif self._is_header_auth: + self._validate_dates() + return self._parse_header_authentication() + else: + # if this request is neither query auth nor header auth + # s3api regard this as not s3 request + raise NotS3Request() + + def _validate_expire_param(self): + """ + Validate Expires in query parameters + :raises: AccessDenied + """ + # Expires header is a float since epoch + try: + ex = S3Timestamp(float(self.params['Expires'])) + except (KeyError, ValueError): + raise AccessDenied(reason='invalid_expires') + + if S3Timestamp.now() > ex: + raise AccessDenied('Request has expired', reason='expired') + + if ex >= 2 ** 31: + raise AccessDenied( + 'Invalid date (should be seconds since epoch): %s' % + self.params['Expires'], reason='invalid_expires') + + def _validate_dates(self): + """ + Validate Date/X-Amz-Date headers for signature v2 + :raises: AccessDenied + :raises: RequestTimeTooSkewed + """ + date_header = self.headers.get('Date') + amz_date_header = self.headers.get('X-Amz-Date') + if not date_header and not amz_date_header: + raise AccessDenied('AWS authentication requires a valid Date ' + 'or x-amz-date header', + reason='invalid_date') + + # Anyways, request timestamp should be validated + epoch = S3Timestamp.zero() + if self.timestamp < epoch: + raise AccessDenied(reason='invalid_date') + + # If the standard date is too far ahead or behind, it is an + # error + delta = abs(int(self.timestamp) - int(S3Timestamp.now())) + if delta > self.conf.allowable_clock_skew: + raise RequestTimeTooSkewed() + + def _validate_sha256(self): + aws_sha256 = self.headers.get('x-amz-content-sha256') + if not aws_sha256: + if self._is_x_amz_content_sha256_required: + msg = 'Missing required header for this request: ' \ + 'x-amz-content-sha256' + raise InvalidRequest(msg) + else: + return + + looks_like_sha256 = ( + aws_sha256 and len(aws_sha256) == 64 and + all(c in '0123456789abcdef' for c in aws_sha256.lower())) + if aws_sha256 == 'UNSIGNED-PAYLOAD': + pass + elif _is_streaming(aws_sha256): + decoded_content_length = self.headers.get( + 'x-amz-decoded-content-length') + try: + decoded_content_length = int(decoded_content_length) + except (ValueError, TypeError): + raise MissingContentLength + if decoded_content_length < 0: + raise InvalidArgument('x-amz-decoded-content-length', + decoded_content_length) + + if not isinstance(self, SigV4Mixin) or self._is_query_auth: + if decoded_content_length < (self.content_length or 0): + raise IncompleteBody( + number_bytes_expected=decoded_content_length, + number_bytes_provided=self.content_length, + ) + body = self.body_file.read() + raise XAmzContentSHA256Mismatch( + client_computed_content_s_h_a256=aws_sha256, + s3_computed_content_s_h_a256=sha256(body).hexdigest(), + ) + elif aws_sha256 in ( + 'STREAMING-AWS4-ECDSA-P256-SHA256-PAYLOAD', + 'STREAMING-AWS4-ECDSA-P256-SHA256-PAYLOAD-TRAILER', + ): + raise S3NotImplemented( + "Don't know how to validate %s streams" + % aws_sha256) + + elif not looks_like_sha256 and self._is_x_amz_content_sha256_required: + raise InvalidArgument( + 'x-amz-content-sha256', + aws_sha256, + 'x-amz-content-sha256 must be UNSIGNED-PAYLOAD, ' + 'STREAMING-UNSIGNED-PAYLOAD-TRAILER, ' + 'STREAMING-AWS4-HMAC-SHA256-PAYLOAD, ' + 'STREAMING-AWS4-HMAC-SHA256-PAYLOAD-TRAILER or ' + 'a valid sha256 value.') + + return aws_sha256 + + def 
_cleanup_content_encoding(self):
+        if 'aws-chunked' in self.headers.get('Content-Encoding', ''):
+            new_enc = ', '.join(
+                enc for enc in list_from_csv(
+                    self.headers.pop('Content-Encoding'))
+                # TODO: test what's stored w/ 'aws-chunked, aws-chunked'
+                if enc != 'aws-chunked')
+            if new_enc:
+                # used to be, AWS would store '', but not any more
+                self.headers['Content-Encoding'] = new_enc
+
+    def _install_streaming_input_wrapper(self, aws_sha256,
+                                         checksum_trailer=None):
+        """
+        Wrap the wsgi input with a reader that parses an aws-chunked body.
+
+        :param aws_sha256: the value of the 'x-amz-content-sha256' header.
+        :param checksum_trailer: the name of an 'x-amz-checksum-*' trailer
+            (if any) that is to be expected at the end of the body.
+        :return: an instance of StreamingInput.
+        """
+        self._cleanup_content_encoding()
+        self.content_length = int(self.headers.get(
+            'x-amz-decoded-content-length'))
+        expected_trailers = set()
+        if aws_sha256 == 'STREAMING-AWS4-HMAC-SHA256-PAYLOAD-TRAILER':
+            expected_trailers.add('x-amz-trailer-signature')
+        if checksum_trailer:
+            expected_trailers.add(checksum_trailer)
+        streaming_input = StreamingInput(
+            self.environ['wsgi.input'],
+            self.content_length,
+            expected_trailers,
+            None if aws_sha256 == 'STREAMING-UNSIGNED-PAYLOAD-TRAILER'
+            else self.sig_checker)
+        self.environ['wsgi.input'] = streaming_input
+        return streaming_input
+
+    def _install_non_streaming_input_wrapper(self, aws_sha256):
+        if (aws_sha256 not in (None, 'UNSIGNED-PAYLOAD') and
+                self.content_length is not None):
+            self.environ['wsgi.input'] = HashingInput(
+                self.environ['wsgi.input'],
+                self.content_length,
+                aws_sha256)
+        # If no content-length, either client's trying to do a HTTP chunked
+        # transfer, or a HTTP/1.0-style transfer (in which case swift will
+        # reject with length-required and we'll translate back to
+        # MissingContentLength)
+
+    def _validate_x_amz_checksum_headers(self):
+        """
+        Validate and return a header that specifies a checksum value. A valid
+        header must be named x-amz-checksum-<algorithm> where <algorithm> is
+        one of the supported checksum algorithms.
+
+        :raises: InvalidRequest if more than one checksum header is found or if
+            an invalid algorithm is specified.
+        :return: a dict containing at most a single checksum header name:value
+            pair.
+        """
+        checksum_headers = {
+            h.lower(): v
+            for h, v in self.headers.items()
+            if (h.lower().startswith('x-amz-checksum-')
+                and h.lower() not in ('x-amz-checksum-algorithm',
+                                      'x-amz-checksum-type'))
+        }
+        if any(h not in CHECKSUMS_BY_HEADER
+               for h in checksum_headers):
+            raise InvalidRequest('The algorithm type you specified in '
+                                 'x-amz-checksum- header is invalid.')
+        _validate_checksum_header_cardinality(len(checksum_headers))
+        return checksum_headers
+
+    def _validate_x_amz_trailer_header(self):
+        """
+        Validate and return the name of a checksum trailer that is declared by
+        an ``x-amz-trailer`` header. A valid trailer must be named
+        x-amz-checksum-<algorithm> where <algorithm> is one of the supported
+        checksum algorithms.
+
+        :raises: InvalidRequest if more than one checksum trailer is declared
+            by the ``x-amz-trailer`` header, or if an invalid algorithm is
+            specified.
+        :return: a list containing at most a single checksum header name.
+        """
+        header = self.headers.get('x-amz-trailer', '').strip()
+        checksum_headers = [
+            v.strip() for v in header.rstrip(',').split(',')
+        ] if header else []
+        if any(h not in CHECKSUMS_BY_HEADER
+               for h in checksum_headers):
+            raise InvalidRequest('The value specified in the x-amz-trailer '
+                                 'header is not supported')
+        _validate_checksum_header_cardinality(len(checksum_headers))
+        return checksum_headers
+
+    def _validate_checksum_headers(self):
+        """
+        A checksum for the request is specified by a checksum header of the
+        form:
+
+            x-amz-checksum-<algorithm>: <value>
+
+        where <algorithm> is one of the supported checksum algorithms and
+        <value> is the value to be checked. A checksum header may be sent in
+        either the headers or the trailers. An ``x-amz-trailer`` header is used
+        to declare that a checksum header is to be expected in the trailers.
+
+        At most one checksum header is allowed in the headers or trailers. If
+        this condition is met, this method returns the name of the checksum
+        header or trailer and a hasher for the checksum algorithm that it
+        declares.
+
+        :raises InvalidRequest: if any of the following conditions occur: more
+            than one checksum header is declared; the checksum header specifies
+            an invalid algorithm; the algorithm does not match the value of any
+            ``x-amz-sdk-checksum-algorithm`` header that is also present; the
+            checksum value is invalid.
+        :raises S3NotImplemented: if the declared algorithm is valid but not
+            supported.
+        :return: a tuple of
+            (hasher, checksum header name, checksum trailer name) where at
+            least one of (checksum header name, checksum trailer name) will be
+            None.
+        """
+        checksum_headers = self._validate_x_amz_checksum_headers()
+        checksum_trailer_headers = self._validate_x_amz_trailer_header()
+        _validate_checksum_header_cardinality(
+            len(checksum_headers) + len(checksum_trailer_headers),
+            headers_and_trailer=True
+        )
+
+        if checksum_headers:
+            checksum_trailer = None
+            checksum_header, b64digest = list(checksum_headers.items())[0]
+            checksum_hasher = _get_checksum_hasher(checksum_header)
+            try:
+                # early check on the value...
+                _validate_checksum_value(checksum_hasher, b64digest)
+            except ValueError:
+                raise InvalidRequest(
+                    'Value for %s header is invalid.'
% checksum_header) + elif checksum_trailer_headers: + checksum_header = None + checksum_trailer = checksum_trailer_headers[0] + checksum_hasher = _get_checksum_hasher(checksum_trailer) + # checksum should appear at end of request in trailers + else: + checksum_hasher = checksum_header = checksum_trailer = None + + checksum_algo = self.headers.get('x-amz-sdk-checksum-algorithm') + if checksum_algo: + if not checksum_hasher: + raise InvalidRequest( + 'x-amz-sdk-checksum-algorithm specified, but no ' + 'corresponding x-amz-checksum-* or x-amz-trailer ' + 'headers were found.') + if checksum_algo.lower() != checksum_hasher.name: + raise InvalidRequest('Value for x-amz-sdk-checksum-algorithm ' + 'header is invalid.') + + return checksum_hasher, checksum_header, checksum_trailer + + def _install_checksumming_input_wrapper( + self, checksum_hasher, checksum_key, checksum_source): + self.environ['wsgi.input'] = ChecksummingInput( + self.environ['wsgi.input'], + self.content_length, + checksum_hasher, + checksum_key, + checksum_source + ) + + def _validate_headers(self): + if 'CONTENT_LENGTH' in self.environ: + try: + if self.content_length < 0: + raise InvalidArgument('Content-Length', + self.content_length) + except (ValueError, TypeError): + raise InvalidArgument('Content-Length', + self.environ['CONTENT_LENGTH']) + + if self.method == 'PUT' and ( + any(h in self.headers for h in ( + 'If-Match', 'If-Modified-Since', 'If-Unmodified-Since')) + or self.headers.get('If-None-Match', '*') != '*'): + raise S3NotImplemented( + 'Conditional object PUTs are not supported.') + + if 'X-Amz-Copy-Source' in self.headers: + try: + check_path_header(self, 'X-Amz-Copy-Source', 2, '') + except swob.HTTPException: + msg = 'Copy Source must mention the source bucket and key: ' \ + 'sourcebucket/sourcekey' + raise InvalidArgument('x-amz-copy-source', + self.headers['X-Amz-Copy-Source'], + msg) + if 'x-amz-metadata-directive' in self.headers: + value = self.headers['x-amz-metadata-directive'] + if value not in ('COPY', 'REPLACE'): + err_msg = 'Unknown metadata directive.' + raise InvalidArgument('x-amz-metadata-directive', value, + err_msg) + + if 'x-amz-storage-class' in self.headers: + # Only STANDARD is supported now. + if self.headers['x-amz-storage-class'] != 'STANDARD': + raise InvalidStorageClass() + + if 'x-amz-mfa' in self.headers: + raise S3NotImplemented('MFA Delete is not supported.') + + sse_value = self.headers.get('x-amz-server-side-encryption') + if sse_value is not None: + if sse_value not in ('aws:kms', 'AES256'): + raise InvalidArgument( + 'x-amz-server-side-encryption', sse_value, + 'The encryption method specified is not supported') + encryption_enabled = get_swift_info(admin=True)['admin'].get( + 'encryption', {}).get('enabled') + if not encryption_enabled or sse_value != 'AES256': + raise S3NotImplemented( + 'Server-side encryption is not supported.') + + if 'x-amz-website-redirect-location' in self.headers: + raise S3NotImplemented('Website redirection is not supported.') + + self._validate_sha256() + + value = _header_strip(self.headers.get('Content-MD5')) + if value is not None: + if not re.match('^[A-Za-z0-9+/]+={0,2}$', value): + # Non-base64-alphabet characters in value. 
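+                # For illustration: a well-formed value is the base64 of the
+                # raw 16-byte digest, e.g. 'XrY7u+Ae7tCTyyK7j1rNww==' for the
+                # body b'hello world'.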
+ raise InvalidDigest(content_md5=value) + try: + self.headers['ETag'] = binascii.b2a_hex( + binascii.a2b_base64(value)) + except binascii.Error: + # incorrect padding, most likely + raise InvalidDigest(content_md5=value) + + if len(self.headers['ETag']) != 32: + raise InvalidDigest(content_md5=value) + + if 'x-amz-tagging' in self.headers: + raise S3NotImplemented('Object tagging is not supported.') + + @property + def body(self): + """ + swob.Request.body is not secure against malicious input. It consumes + too much memory without any check when the request body is excessively + large. Use xml() instead. + """ + raise AttributeError("No attribute 'body'") + + def xml(self, max_length): + """ + Similar to swob.Request.body, but it checks the content length before + creating a body string. + """ + te = self.headers.get('transfer-encoding', '') + te = [x.strip() for x in te.split(',') if x.strip()] + if te and (len(te) > 1 or te[-1] != 'chunked'): + raise S3NotImplemented('A header you provided implies ' + 'functionality that is not implemented', + header='Transfer-Encoding') + + ml = self.message_length() + if ml and ml > max_length: + raise MalformedXML() + + if te or ml: + # Limit the read similar to how SLO handles manifests + with self.translate_read_errors(): + body = self.body_file.read(max_length) + else: + # No (or zero) Content-Length provided, and not chunked transfer; + # no body. Assume zero-length, and enforce a required body below. + return None + + return body + + def check_md5(self, body): + """ + Check the md5 of the request body against the content-md5 header if the + header is present. + + :raise BadDigest: if the header is present but does not match the + calculated body md5. + :return: True if the header is present, False otherwise. 
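+
+        For illustration, a request whose Content-MD5 header is
+        '1B2M2Y8AsgTpgAmY7PhCfg==' (the base64 MD5 of zero bytes) passes this
+        check only when ``body`` is empty.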
+ """ + content_md5 = self.environ.get('HTTP_CONTENT_MD5') + if not content_md5: + return False + digest = base64_str(md5(body, usedforsecurity=False).digest()) + if content_md5 != digest: + raise BadDigest(expected_digest=content_md5) + return True + + def require_md5(self, body): + allowed_checksum_env_keys = [ + 'HTTP_' + hdr.upper().replace('-', '_') + for hdr in CHECKSUMS_BY_HEADER.keys() + ] + allowed_checksum_env_keys.append('HTTP_CONTENT_MD5') + if not any(k in self.environ for k in allowed_checksum_env_keys): + raise InvalidRequest('Missing required header for this request: ' + 'Content-MD5 OR x-amz-checksum-*') + self.check_md5(body) + + def _copy_source_headers(self): + env = {} + for key, value in self.environ.items(): + if key.startswith('HTTP_X_AMZ_COPY_SOURCE_'): + env[key.replace('X_AMZ_COPY_SOURCE_', '')] = value + + return swob.HeaderEnvironProxy(env) + + def check_copy_source(self, app): + """ + check_copy_source checks the copy source existence and if copying an + object to itself, for illegal request parameters + + :returns: the source HEAD response + """ + try: + src_path = self.headers['X-Amz-Copy-Source'] + except KeyError: + return None + + src_path, qs = src_path.partition('?')[::2] + parsed = parse_qsl(qs, True) + if not parsed: + query = {} + elif len(parsed) == 1 and parsed[0][0] == 'versionId': + query = {'version-id': parsed[0][1]} + else: + raise InvalidArgument('X-Amz-Copy-Source', + self.headers['X-Amz-Copy-Source'], + 'Unsupported copy source parameter.') + + src_path = unquote(src_path) + src_path = src_path if src_path.startswith('/') else ('/' + src_path) + src_bucket, src_obj = split_path(src_path, 0, 2, True) + + headers = swob.HeaderKeyDict() + headers.update(self._copy_source_headers()) + + src_resp = self.get_response(app, 'HEAD', src_bucket, + swob.str_to_wsgi(src_obj), + headers=headers, query=query) + if src_resp.status_int == 304: # pylint: disable-msg=E1101 + raise PreconditionFailed() + + if (self.container_name == src_bucket and + self.object_name == src_obj and + self.headers.get('x-amz-metadata-directive', + 'COPY') == 'COPY' and + not query): + raise InvalidRequest("This copy request is illegal " + "because it is trying to copy an " + "object to itself without " + "changing the object's metadata, " + "storage class, website redirect " + "location or encryption " + "attributes.") + # We've done some normalizing; write back so it's ready for + # to_swift_req + self.headers['X-Amz-Copy-Source'] = quote(src_path) + if query: + self.headers['X-Amz-Copy-Source'] += \ + '?versionId=' + query['version-id'] + return src_resp + + def _canonical_uri(self): + """ + Require bucket name in canonical_uri for v2 in virtual hosted-style. 
+ """ + raw_path_info = self.environ.get('RAW_PATH_INFO', self.path) + if self.bucket_in_host: + raw_path_info = '/' + self.bucket_in_host + raw_path_info + return raw_path_info + + def signature_does_not_match_kwargs(self): + return { + 'a_w_s_access_key_id': self.access_key, + 'string_to_sign': self.sig_checker.string_to_sign, + 'signature_provided': self.signature, + 'string_to_sign_bytes': ' '.join( + format(b, '02x') for b in self.sig_checker.string_to_sign), + } + + @property + def controller_name(self): + return self.controller.__name__[:-len('Controller')] + + @property + def controller(self): + if self.is_service_request: + return ServiceController + + if not self.conf.allow_multipart_uploads: + multi_part = ['partNumber', 'uploadId', 'uploads'] + if len([p for p in multi_part if p in self.params]): + raise S3NotImplemented("Multi-part feature isn't support") + + if 'acl' in self.params: + return AclController + if 'delete' in self.params: + return MultiObjectDeleteController + if 'location' in self.params: + return LocationController + if 'logging' in self.params: + return LoggingStatusController + if 'partNumber' in self.params: + if self.method == 'PUT': + return PartController + else: + return ObjectController + if 'uploadId' in self.params: + return UploadController + if 'uploads' in self.params: + return UploadsController + if 'versioning' in self.params: + return VersioningController + if 'tagging' in self.params: + return TaggingController + if 'object-lock' in self.params: + return ObjectLockController + + unsupported = ('notification', 'policy', 'requestPayment', 'torrent', + 'website', 'cors', 'restore') + if set(unsupported) & set(self.params): + return UnsupportedController + + if self.is_object_request: + return ObjectController + return BucketController + + @property + def is_service_request(self): + return not self.container_name + + @property + def is_bucket_request(self): + return self.container_name and not self.object_name + + @property + def is_object_request(self): + return self.container_name and self.object_name + + @property + def is_authenticated(self): + return self.account is not None + + def to_swift_req(self, method, container, obj, query=None, + body=None, headers=None): + """ + Create a Swift request based on this request's environment. + """ + if self.account is None: + account = swob.str_to_wsgi(self.access_key) + else: + account = self.account + + env = self.environ.copy() + env['swift.infocache'] = self.environ.setdefault('swift.infocache', {}) + + def sanitize(value): + if set(value).issubset(string.printable): + return value + + value = Header(value, 'UTF-8').encode() + if value.startswith('=?utf-8?q?'): + return '=?UTF-8?Q?' + value[10:] + elif value.startswith('=?utf-8?b?'): + return '=?UTF-8?B?' + value[10:] + else: + return value + + if 'headers_raw' in env: # eventlet >= 0.19.0 + # See https://github.com/eventlet/eventlet/commit/67ec999 + for key, value in env['headers_raw']: + if not key.lower().startswith('x-amz-meta-'): + continue + # AWS ignores user-defined headers with these characters + if any(c in key for c in ' "),/;<=>?@[\\]{}'): + # NB: apparently, '(' *is* allowed + continue + # Note that this may have already been deleted, e.g. if the + # client sent multiple headers with the same name, or both + # x-amz-meta-foo-bar and x-amz-meta-foo_bar + env.pop('HTTP_' + key.replace('-', '_').upper(), None) + # Need to preserve underscores. Since we know '=' can't be + # present, quoted-printable seems appropriate. 
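+                    # For example, an incoming 'x-amz-meta-foo_bar' header
+                    # becomes the WSGI key 'HTTP_X_OBJECT_META_FOO=5FBAR'
+                    # here, and is mapped back to 'x-amz-meta-foo_bar' by
+                    # translate_swift_to_s3() on the way out.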
+ key = key.replace('_', '=5F').replace('-', '_').upper() + key = 'HTTP_X_OBJECT_META_' + key[11:] + if key in env: + env[key] += ',' + sanitize(value) + else: + env[key] = sanitize(value) + else: # mostly-functional fallback + for key in self.environ: + if not key.startswith('HTTP_X_AMZ_META_'): + continue + # AWS ignores user-defined headers with these characters + if any(c in key for c in ' "),/;<=>?@[\\]{}'): + # NB: apparently, '(' *is* allowed + continue + env['HTTP_X_OBJECT_META_' + key[16:]] = sanitize(env[key]) + del env[key] + + copy_from_version_id = '' + if 'HTTP_X_AMZ_COPY_SOURCE' in env and env['REQUEST_METHOD'] == 'PUT': + env['HTTP_X_COPY_FROM'], copy_from_version_id = env[ + 'HTTP_X_AMZ_COPY_SOURCE'].partition('?versionId=')[::2] + del env['HTTP_X_AMZ_COPY_SOURCE'] + env['CONTENT_LENGTH'] = '0' + if env.pop('HTTP_X_AMZ_METADATA_DIRECTIVE', None) == 'REPLACE': + env['HTTP_X_FRESH_METADATA'] = 'True' + else: + copy_exclude_headers = ('HTTP_CONTENT_DISPOSITION', + 'HTTP_CONTENT_ENCODING', + 'HTTP_CONTENT_LANGUAGE', + 'CONTENT_TYPE', + 'HTTP_EXPIRES', + 'HTTP_CACHE_CONTROL', + 'HTTP_X_ROBOTS_TAG') + for key in copy_exclude_headers: + env.pop(key, None) + for key in list(env.keys()): + if key.startswith('HTTP_X_OBJECT_META_'): + del env[key] + + if self.conf.force_swift_request_proxy_log: + env['swift.proxy_access_log_made'] = False + env['swift.source'] = 'S3' + if method is not None: + env['REQUEST_METHOD'] = method + + if obj: + path = '/v1/%s/%s/%s' % (account, container, obj) + elif container: + path = '/v1/%s/%s' % (account, container) + else: + path = '/v1/%s' % (account) + env['PATH_INFO'] = path + + params = [] + if query is not None: + for key, value in sorted(query.items()): + if value is not None: + params.append('%s=%s' % (key, quote(str(value)))) + else: + params.append(key) + if copy_from_version_id and not (query and query.get('version-id')): + params.append('version-id=' + copy_from_version_id) + env['QUERY_STRING'] = '&'.join(params) + + return swob.Request.blank(quote(path), environ=env, body=body, + headers=headers) + + def _swift_success_codes(self, method, container, obj): + """ + Returns a list of expected success codes from Swift. + """ + if not container: + # Swift account access. + code_map = { + 'GET': [ + HTTP_OK, + ], + } + elif not obj: + # Swift container access. + code_map = { + 'HEAD': [ + HTTP_NO_CONTENT, + ], + 'GET': [ + HTTP_OK, + HTTP_NO_CONTENT, + ], + 'PUT': [ + HTTP_CREATED, + ], + 'POST': [ + HTTP_NO_CONTENT, + ], + 'DELETE': [ + HTTP_NO_CONTENT, + ], + } + else: + # Swift object access. 
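+            # e.g. an object PUT is only considered successful on
+            # 201 Created or 202 Accepted (SLO heartbeating); any other
+            # status falls through to the error handling in _get_response().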
+ code_map = { + 'HEAD': [ + HTTP_OK, + HTTP_PARTIAL_CONTENT, + HTTP_NOT_MODIFIED, + ], + 'GET': [ + HTTP_OK, + HTTP_PARTIAL_CONTENT, + HTTP_NOT_MODIFIED, + ], + 'PUT': [ + HTTP_CREATED, + HTTP_ACCEPTED, # For SLO with heartbeating + ], + 'POST': [ + HTTP_ACCEPTED, + ], + 'DELETE': [ + HTTP_OK, + HTTP_NO_CONTENT, + ], + } + + return code_map[method] + + def _bucket_put_accepted_error(self, container, app): + sw_req = self.to_swift_req('HEAD', container, None) + info = get_container_info(sw_req.environ, app, swift_source='S3') + sysmeta = info.get('sysmeta', {}) + try: + acl = json.loads(sysmeta.get('s3api-acl', + sysmeta.get('swift3-acl', '{}'))) + owner = acl.get('Owner') + except (ValueError, TypeError, KeyError): + owner = None + if owner is None or owner == self.user_id: + raise BucketAlreadyOwnedByYou(container) + raise BucketAlreadyExists(container) + + def _swift_error_codes(self, method, container, obj, env, app): + """ + Returns a dict from expected Swift error codes to the corresponding S3 + error responses. + """ + if not container: + # Swift account access. + code_map = { + 'GET': { + }, + } + elif not obj: + # Swift container access. + code_map = { + 'HEAD': { + HTTP_NOT_FOUND: (NoSuchBucket, container), + }, + 'GET': { + HTTP_NOT_FOUND: (NoSuchBucket, container), + }, + 'PUT': { + HTTP_ACCEPTED: (self._bucket_put_accepted_error, container, + app), + }, + 'POST': { + HTTP_NOT_FOUND: (NoSuchBucket, container), + }, + 'DELETE': { + HTTP_NOT_FOUND: (NoSuchBucket, container), + HTTP_CONFLICT: BucketNotEmpty, + }, + } + else: + # Swift object access. + + # 404s differ depending upon whether the bucket exists + # Note that base-container-existence checks happen elsewhere for + # multi-part uploads, and get_container_info should be pulling + # from the env cache + def not_found_handler(): + if container.endswith(MULTIUPLOAD_SUFFIX) or \ + is_success(get_container_info( + env, app, swift_source='S3').get('status')): + return NoSuchKey(obj) + return NoSuchBucket(container) + + # Since BadDigest ought to plumb in some client-provided values, + # defer evaluation until we know they're provided + def bad_digest_handler(): + etag = binascii.hexlify(base64.b64decode( + env['HTTP_CONTENT_MD5'])) + return BadDigest( + expected_digest=etag, # yes, really hex + # TODO: plumb in calculated_digest, as b64 + ) + + code_map = { + 'HEAD': { + HTTP_NOT_FOUND: not_found_handler, + HTTP_PRECONDITION_FAILED: PreconditionFailed, + }, + 'GET': { + HTTP_NOT_FOUND: not_found_handler, + HTTP_PRECONDITION_FAILED: PreconditionFailed, + }, + 'PUT': { + HTTP_NOT_FOUND: (NoSuchBucket, container), + HTTP_UNPROCESSABLE_ENTITY: bad_digest_handler, + HTTP_REQUEST_ENTITY_TOO_LARGE: EntityTooLarge, + HTTP_LENGTH_REQUIRED: MissingContentLength, + HTTP_REQUEST_TIMEOUT: RequestTimeout, + HTTP_PRECONDITION_FAILED: PreconditionFailed, + HTTP_CLIENT_CLOSED_REQUEST: RequestTimeout, + }, + 'POST': { + HTTP_NOT_FOUND: not_found_handler, + HTTP_PRECONDITION_FAILED: PreconditionFailed, + }, + 'DELETE': { + HTTP_NOT_FOUND: (NoSuchKey, obj), + }, + } + + return code_map[method] + + @contextlib.contextmanager + def translate_read_errors(self): + try: + yield + except S3InputIncomplete: + raise IncompleteBody('The request body terminated unexpectedly') + except S3InputSHA256Mismatch as err: + # hopefully by now any modifications to the path (e.g. 
tenant to + # account translation) will have been made by auth middleware + raise XAmzContentSHA256Mismatch( + client_computed_content_s_h_a256=err.expected, + s3_computed_content_s_h_a256=err.computed, + ) + except S3InputChecksumMismatch as e: + raise BadDigest( + 'The %s you specified did not ' + 'match the calculated checksum.' % e.args[0]) + except S3InputChecksumTrailerInvalid as e: + raise InvalidRequest( + 'Value for %s trailing header is invalid.' % e.trailer) + except S3InputChunkSignatureMismatch: + raise SignatureDoesNotMatch( + **self.signature_does_not_match_kwargs()) + except S3InputSizeError as e: + raise IncompleteBody( + number_bytes_expected=e.expected, + number_bytes_provided=e.provided, + ) + except S3InputChunkTooSmall as e: + raise InvalidChunkSizeError( + chunk=e.chunk_number, + bad_chunk_size=e.bad_chunk_size, + ) + except S3InputMalformedTrailer: + raise MalformedTrailerError + except S3InputMissingSecret: + # XXX: We should really log something here. The poor user can't do + # anything about this; we need to notify the operator to notify the + # auth middleware developer + raise S3NotImplemented('Transferring payloads in multiple chunks ' + 'using aws-chunked is not supported.') + except S3InputError: + # All cases should be covered above, but belt & braces + # NB: general exception handler in s3api.py will log traceback + raise InternalError + + def _get_response(self, app, method, container, obj, + headers=None, body=None, query=None): + """ + Calls the application with this request's environment. Returns a + S3Response object that wraps up the application's result. + """ + + method = method or self.environ['REQUEST_METHOD'] + + if container is None: + container = self.container_name + if obj is None: + obj = self.object_name + + sw_req = self.to_swift_req(method, container, obj, headers=headers, + body=body, query=query) + + try: + with self.translate_read_errors(): + sw_resp = sw_req.get_response(app) + finally: + # reuse account + _, self.account, _ = split_path(sw_req.environ['PATH_INFO'], + 2, 3, True) + self.environ['s3api.backend_path'] = sw_req.environ['PATH_INFO'] + + # keep a record of the backend policy index so that the s3api can add + # it to the headers of whatever response it returns, which may not + # necessarily be this resp. 
+ self.policy_index = get_policy_index(sw_req.headers, sw_resp.headers) + resp = S3Response.from_swift_resp(sw_resp) + status = resp.status_int # pylint: disable-msg=E1101 + + if not self.user_id: + if 'HTTP_X_USER_NAME' in sw_resp.environ: + # keystone + self.user_id = "%s:%s" % ( + sw_resp.environ['HTTP_X_TENANT_NAME'], + sw_resp.environ['HTTP_X_USER_NAME']) + else: + # tempauth + self.user_id = self.access_key + + success_codes = self._swift_success_codes(method, container, obj) + error_codes = self._swift_error_codes(method, container, obj, + sw_req.environ, app) + + if status in success_codes: + return resp + + err_msg = resp.body + + if status in error_codes: + err_resp = \ + error_codes[sw_resp.status_int] # pylint: disable-msg=E1101 + if isinstance(err_resp, tuple): + raise err_resp[0](*err_resp[1:]) + elif b'quota' in err_msg: + raise err_resp(err_msg) + else: + raise err_resp() + + if status == HTTP_BAD_REQUEST: + err_str = err_msg.decode('utf8') + if 'X-Delete-At' in err_str: + raise InvalidArgument('X-Delete-At', + self.headers['X-Delete-At'], + err_str) + if 'X-Delete-After' in err_str: + raise InvalidArgument('X-Delete-After', + self.headers['X-Delete-After'], + err_str) + else: + raise InvalidRequest(msg=err_str) + if status == HTTP_UNAUTHORIZED: + raise SignatureDoesNotMatch( + **self.signature_does_not_match_kwargs()) + if status == HTTP_FORBIDDEN: + raise AccessDenied(reason='forbidden') + if status == HTTP_REQUESTED_RANGE_NOT_SATISFIABLE: + self.validate_part_number( + parts_count=resp.headers.get('x-amz-mp-parts-count')) + raise InvalidRange() + if status == HTTP_SERVICE_UNAVAILABLE: + raise ServiceUnavailable() + if status in (HTTP_RATE_LIMITED, HTTP_TOO_MANY_REQUESTS): + if self.conf.ratelimit_as_client_error: + raise SlowDown(status='429 Slow Down') + raise SlowDown() + if resp.status_int == HTTP_CONFLICT: + if self.method == 'GET': + raise BrokenMPU() + else: + raise ServiceUnavailable() + + raise InternalError('unexpected status code %d' % status) + + def get_response(self, app, method=None, container=None, obj=None, + headers=None, body=None, query=None): + """ + get_response is an entry point to be extended for child classes. + If additional tasks needed at that time of getting swift response, + we can override this method. + swift.common.middleware.s3api.s3request.S3Request need to just call + _get_response to get pure swift response. + """ + + if 'HTTP_X_AMZ_ACL' in self.environ: + handle_acl_header(self) + + return self._get_response(app, method, container, obj, + headers, body, query) + + def get_validated_param(self, param, default, limit=MAX_32BIT_INT): + value = default + if param in self.params: + try: + value = int(self.params[param]) + if value < 0: + err_msg = 'Argument %s must be an integer between 0 and' \ + ' %d' % (param, MAX_32BIT_INT) + raise InvalidArgument(param, self.params[param], err_msg) + + if value > MAX_32BIT_INT: + # check the value because int() could build either a long + # instance or a 64bit integer. + raise ValueError() + + if limit < value: + value = limit + + except ValueError: + err_msg = 'Provided %s not an integer or within ' \ + 'integer range' % param + raise InvalidArgument(param, self.params[param], err_msg) + + return value + + def get_container_info(self, app): + """ + get_container_info will return a result dict of get_container_info + from the backend Swift. 
+ + :returns: a dictionary of container info from + swift.controllers.base.get_container_info + :raises: NoSuchBucket when the container doesn't exist + :raises: InternalError when the request failed without 404 + """ + if not self.is_authenticated: + sw_req = self.to_swift_req('TEST', None, None, body='') + # don't show log message of this request + sw_req.environ['swift.proxy_access_log_made'] = True + + sw_resp = sw_req.get_response(app) + + if not sw_req.remote_user: + raise SignatureDoesNotMatch( + **self.signature_does_not_match_kwargs()) + + _, self.account, _ = split_path(sw_resp.environ['PATH_INFO'], + 2, 3, True) + sw_req = self.to_swift_req('TEST', self.container_name, None) + info = get_container_info(sw_req.environ, app, swift_source='S3') + if is_success(info['status']): + return info + elif info['status'] == HTTP_NOT_FOUND: + raise NoSuchBucket(self.container_name) + elif info['status'] == HTTP_SERVICE_UNAVAILABLE: + raise ServiceUnavailable() + else: + raise InternalError( + 'unexpected status code %d' % info['status']) + + def gen_multipart_manifest_delete_query(self, app, obj=None, version=None): + if not self.conf.allow_multipart_uploads: + return {} + if not obj: + obj = self.object_name + query = {'symlink': 'get'} + if version is not None: + query['version-id'] = version + resp = self.get_response(app, 'HEAD', obj=obj, query=query) + if not resp.is_slo: + return {} + elif resp.sysmeta_headers.get(sysmeta_header('object', 'etag')): + # Even if allow_async_delete is turned off, SLO will just handle + # the delete synchronously, so we don't need to check before + # setting async=on + return {'multipart-manifest': 'delete', 'async': 'on'} + else: + return {'multipart-manifest': 'delete'} + + def set_acl_handler(self, handler): + pass + + +class S3AclRequest(S3Request): + """ + S3Acl request object. + """ + + def __init__(self, env, app=None, conf=None): + super(S3AclRequest, self).__init__(env, app, conf) + self.authenticate(app) + self.acl_handler = None + + @property + def controller(self): + if 'acl' in self.params and not self.is_service_request: + return S3AclController + return super(S3AclRequest, self).controller + + def authenticate(self, app): + """ + authenticate method will run pre-authenticate request and retrieve + account information. + Note that it currently supports only keystone and tempauth. 
+ (no support for the third party authentication middleware) + """ + sw_req = self.to_swift_req('TEST', None, None, body='') + # don't show log message of this request + sw_req.environ['swift.proxy_access_log_made'] = True + + sw_resp = sw_req.get_response(app) + + if not sw_req.remote_user: + raise SignatureDoesNotMatch( + **self.signature_does_not_match_kwargs()) + + _, self.account, _ = split_path(sw_resp.environ['PATH_INFO'], + 2, 3, True) + + if 'HTTP_X_USER_NAME' in sw_resp.environ: + # keystone + self.user_id = "%s:%s" % (sw_resp.environ['HTTP_X_TENANT_NAME'], + sw_resp.environ['HTTP_X_USER_NAME']) + else: + # tempauth + self.user_id = self.access_key + + sw_req.environ.get('swift.authorize', lambda req: None)(sw_req) + self.environ['swift_owner'] = sw_req.environ.get('swift_owner', False) + if 'REMOTE_USER' in sw_req.environ: + self.environ['REMOTE_USER'] = sw_req.environ['REMOTE_USER'] + + # Need to skip S3 authorization on subsequent requests to prevent + # overwriting the account in PATH_INFO + del self.environ['s3api.auth_details'] + + def to_swift_req(self, method, container, obj, query=None, + body=None, headers=None): + sw_req = super(S3AclRequest, self).to_swift_req( + method, container, obj, query, body, headers) + if self.account: + sw_req.environ['swift_owner'] = True # needed to set ACL + sw_req.environ['swift.authorize_override'] = True + sw_req.environ['swift.authorize'] = lambda req: None + return sw_req + + def get_acl_response(self, app, method=None, container=None, obj=None, + headers=None, body=None, query=None): + """ + Wrapper method of _get_response to add s3 acl information + from response sysmeta headers. + """ + + resp = self._get_response( + app, method, container, obj, headers, body, query) + resp.bucket_acl = decode_acl( + 'container', resp.sysmeta_headers, self.conf.allow_no_owner) + resp.object_acl = decode_acl( + 'object', resp.sysmeta_headers, self.conf.allow_no_owner) + + return resp + + def get_response(self, app, method=None, container=None, obj=None, + headers=None, body=None, query=None): + """ + Wrap up get_response call to hook with acl handling method. + """ + if not self.acl_handler: + # we should set acl_handler all time before calling get_response + raise Exception('get_response called before set_acl_handler') + resp = self.acl_handler.handle_acl( + app, method, container, obj, headers) + + # possible to skip recalling get_response_acl if resp is not + # None (e.g. HEAD) + if resp: + return resp + return self.get_acl_response(app, method, container, obj, + headers, body, query) + + def set_acl_handler(self, acl_handler): + self.acl_handler = acl_handler + + +class SigV4Request(SigV4Mixin, S3Request): + pass + + +class SigV4S3AclRequest(SigV4Mixin, S3AclRequest): + pass diff --git a/swift/common/middleware/s3api/s3response.py b/swift/common/middleware/s3api/s3response.py new file mode 100644 index 0000000000..7a84411d28 --- /dev/null +++ b/swift/common/middleware/s3api/s3response.py @@ -0,0 +1,818 @@ +# Copyright (c) 2014 OpenStack Foundation. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. 
+# See the License for the specific language governing permissions and +# limitations under the License. + +import re +from collections.abc import MutableMapping +from functools import partial + +from swift.common import header_key_dict +from swift.common import swob +from swift.common.utils import config_true_value +from swift.common.request_helpers import is_sys_meta + +from swift.common.middleware.s3api.utils import snake_to_camel, \ + sysmeta_prefix, sysmeta_header +from swift.common.middleware.s3api.etree import Element, SubElement, tostring +from swift.common.middleware.versioned_writes.object_versioning import \ + DELETE_MARKER_CONTENT_TYPE + + +class HeaderKeyDict(header_key_dict.HeaderKeyDict): + """ + Similar to the Swift's normal HeaderKeyDict class, but its key name is + normalized as S3 clients expect. + """ + @staticmethod + def _title(s): + s = header_key_dict.HeaderKeyDict._title(s) + if s.lower() == 'etag': + # AWS Java SDK expects only 'ETag'. + return 'ETag' + if s.lower().startswith('x-amz-'): + # AWS headers returned by S3 are lowercase. + return swob.bytes_to_wsgi(swob.wsgi_to_bytes(s).lower()) + return s + + +def translate_swift_to_s3(key, val): + _key = swob.bytes_to_wsgi(swob.wsgi_to_bytes(key).lower()) + + def translate_meta_key(_key): + if not _key.startswith('x-object-meta-'): + return _key + # Note that AWS allows user-defined metadata with underscores in the + # header, while WSGI (and other protocols derived from CGI) does not + # differentiate between an underscore and a dash. Fortunately, + # eventlet exposes the raw headers from the client, so we could + # translate '_' to '=5F' on the way in. Now, we translate back. + return 'x-amz-meta-' + _key[14:].replace('=5f', '_') + + if _key.startswith('x-object-meta-'): + return translate_meta_key(_key), val + elif _key in ('accept-ranges', 'content-length', 'content-type', + 'content-range', 'content-encoding', + 'content-disposition', 'content-language', + 'etag', 'last-modified', 'x-robots-tag', + 'cache-control', 'expires'): + return key, val + elif _key == 'x-object-version-id': + return 'x-amz-version-id', val + elif _key == 'x-parts-count': + return 'x-amz-mp-parts-count', val + elif _key == 'x-copied-from-version-id': + return 'x-amz-copy-source-version-id', val + elif _key == 'x-backend-content-type' and \ + val == DELETE_MARKER_CONTENT_TYPE: + return 'x-amz-delete-marker', 'true' + elif _key == 'access-control-expose-headers': + exposed_headers = val.split(', ') + exposed_headers.extend([ + 'x-amz-request-id', + 'x-amz-id-2', + ]) + return 'access-control-expose-headers', ', '.join( + translate_meta_key(h) for h in exposed_headers) + elif _key == 'access-control-allow-methods': + methods = val.split(', ') + try: + methods.remove('COPY') # that's not a thing in S3 + except ValueError: + pass # not there? don't worry about it + return key, ', '.join(methods) + elif _key.startswith('access-control-'): + return key, val + # else, drop the header + return None + + +class S3ResponseBase(object): + """ + Base class for swift3 responses. + """ + pass + + +class S3Response(S3ResponseBase, swob.Response): + """ + Similar to the Response class in Swift, but uses our HeaderKeyDict for + headers instead of Swift's HeaderKeyDict. This also translates Swift + specific headers to S3 headers. 
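+    For example, 'x-object-version-id' is returned as 'x-amz-version-id',
+    'x-parts-count' as 'x-amz-mp-parts-count', and 'x-object-meta-*' as
+    'x-amz-meta-*' (see translate_swift_to_s3 above).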
+ """ + + def __init__(self, *args, **kwargs): + swob.Response.__init__(self, *args, **kwargs) + + s3_sysmeta_headers = swob.HeaderKeyDict() + sw_headers = swob.HeaderKeyDict() + headers = HeaderKeyDict() + self.is_slo = False + + def is_swift3_sysmeta(sysmeta_key, server_type): + swift3_sysmeta_prefix = ( + 'x-%s-sysmeta-swift3' % server_type).lower() + return sysmeta_key.lower().startswith(swift3_sysmeta_prefix) + + def is_s3api_sysmeta(sysmeta_key, server_type): + s3api_sysmeta_prefix = sysmeta_prefix(_server_type).lower() + return sysmeta_key.lower().startswith(s3api_sysmeta_prefix) + + for key, val in self.headers.items(): + if is_sys_meta('object', key) or is_sys_meta('container', key): + _server_type = key.split('-')[1] + if is_swift3_sysmeta(key, _server_type): + # To be compatible with older swift3, translate swift3 + # sysmeta to s3api sysmeta here + key = sysmeta_prefix(_server_type) + \ + key[len('x-%s-sysmeta-swift3-' % _server_type):] + + if key not in s3_sysmeta_headers: + # To avoid overwrite s3api sysmeta by older swift3 + # sysmeta set the key only when the key does not exist + s3_sysmeta_headers[key] = val + elif is_s3api_sysmeta(key, _server_type): + s3_sysmeta_headers[key] = val + else: + sw_headers[key] = val + else: + sw_headers[key] = val + + # Handle swift headers + for key, val in sw_headers.items(): + s3_pair = translate_swift_to_s3(key, val) + if s3_pair is None: + continue + headers[s3_pair[0]] = s3_pair[1] + + self.is_slo = config_true_value(sw_headers.get( + 'x-static-large-object')) + + # Check whether we stored the AWS-style etag on upload + override_etag = s3_sysmeta_headers.get( + sysmeta_header('object', 'etag')) + if override_etag not in (None, ''): + # Multipart uploads in AWS have ETags like + # - + headers['etag'] = override_etag + elif self.is_slo and 'etag' in headers: + # Many AWS clients use the presence of a '-' to decide whether + # to attempt client-side download validation, so even if we + # didn't store the AWS-style header, tack on a '-N'. (Use 'N' + # because we don't actually know how many parts there are.) + headers['etag'] += '-N' + + self.headers = headers + + if self.etag: + # add double quotes to the etag header + self.etag = self.etag + + # Used for pure swift header handling at the request layer + self.sw_headers = sw_headers + self.sysmeta_headers = s3_sysmeta_headers + + @classmethod + def from_swift_resp(cls, sw_resp): + """ + Create a new S3 response object based on the given Swift response. + """ + if sw_resp.app_iter: + body = None + app_iter = sw_resp.app_iter + else: + body = sw_resp.body + app_iter = None + + resp = cls(status=sw_resp.status, headers=sw_resp.headers, + request=sw_resp.request, body=body, app_iter=app_iter, + conditional_response=sw_resp.conditional_response) + resp.environ.update(sw_resp.environ) + + return resp + + def append_copy_resp_body(self, controller_name, last_modified): + elem = Element('Copy%sResult' % controller_name) + SubElement(elem, 'LastModified').text = last_modified + SubElement(elem, 'ETag').text = '"%s"' % self.etag + self.headers['Content-Type'] = 'application/xml' + self.body = tostring(elem) + self.etag = None + + +HTTPOk = partial(S3Response, status=200) +HTTPCreated = partial(S3Response, status=201) +HTTPAccepted = partial(S3Response, status=202) +HTTPNoContent = partial(S3Response, status=204) +HTTPPartialContent = partial(S3Response, status=206) + + +class ErrorResponse(S3ResponseBase, swob.HTTPException): + """ + S3 error object. 
+ + Reference information about S3 errors is available at: + http://docs.aws.amazon.com/AmazonS3/latest/API/ErrorResponses.html + """ + _status = '' + _msg = '' + _code = '' + xml_declaration = True + + def __init__(self, msg=None, reason=None, *args, **kwargs): + if msg: + self._msg = msg + if not self._code: + self._code = self.__class__.__name__ + self.reason = reason + + self.info = kwargs.copy() + for reserved_key in ('headers', 'body'): + if self.info.get(reserved_key): + del (self.info[reserved_key]) + + swob.HTTPException.__init__( + self, status=kwargs.pop('status', self._status), + # we use an app_iter, so that we can add our trans_id to the resp + # xml *after* we've been called - technically any non-None app_iter + # would do, we override swob.Response._response_iter anyway. + app_iter=self._body_iter(), + content_type='application/xml', *args, + **kwargs) + self.headers = HeaderKeyDict(self.headers) + + @property + def summary(self): + """Provide a summary of the error code and reason.""" + if self.reason: + summary = '.'.join([self._code, self.reason]) + else: + summary = self._code + return summary.replace(' ', '_') + + @property + def metric_name(self): + return '.'.join([str(self.status_int), self.summary]) + + def _body_iter(self): + error_elem = Element('Error') + SubElement(error_elem, 'Code').text = self._code + SubElement(error_elem, 'Message').text = self._msg + # N.B. swob.Response objects don't normally have an environ attribute + # when they're created, but swob always gives this to us when we're + # __call__'d + if 'swift.trans_id' in self.environ: + request_id = self.environ['swift.trans_id'] + SubElement(error_elem, 'RequestId').text = request_id + + self._dict_to_etree(error_elem, self.info) + + yield tostring(error_elem, use_s3ns=False, + xml_declaration=self.xml_declaration) + + def _response_iter(self, app_iter, body): + # we don't actually want our _response_iter to be a generator, a list + # of strings is much better for eventlet.wsgi.server connection + # handling and request pipelining and ErrorResponses are small. FWIW + # we now have self.environ, app_iter=self._body_iter() and body is None + return super()._response_iter(list(app_iter), body) + + def _dict_to_etree(self, parent, d): + for key, value in d.items(): + tag = re.sub(r'\W', '', snake_to_camel(key)) + elem = SubElement(parent, tag) + + if isinstance(value, (dict, MutableMapping)): + self._dict_to_etree(elem, value) + else: + if isinstance(value, (int, float, bool)): + value = str(value) + try: + elem.text = value + except ValueError: + # We set an invalid string for XML. + elem.text = '(invalid string)' + + +class AccessDenied(ErrorResponse): + _status = '403 Forbidden' + _msg = 'Access Denied.' + + +class AccountProblem(ErrorResponse): + _status = '403 Forbidden' + _msg = 'There is a problem with your AWS account that prevents the ' \ + 'operation from completing successfully.' + + +class AmbiguousGrantByEmailAddress(ErrorResponse): + _status = '400 Bad Request' + _msg = 'The e-mail address you provided is associated with more than ' \ + 'one account.' + + +class AuthorizationHeaderMalformed(ErrorResponse): + _status = '400 Bad Request' + _msg = 'The authorization header is malformed; the authorization ' \ + 'header requires three components: Credential, SignedHeaders, ' \ + 'and Signature.' 
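# A minimal usage sketch of the summary/metric_name helpers defined above,
# assuming an interactive session with this module importable; the expected
# values are derived by hand from the code, not captured output:
#
#   >>> err = AccessDenied(reason='invalid date')
#   >>> err.summary
#   'AccessDenied.invalid_date'
#   >>> err.metric_name
#   '403.AccessDenied.invalid_date'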
+ + +class AuthorizationQueryParametersError(ErrorResponse): + _status = '400 Bad Request' + + +class BadDigest(ErrorResponse): + _status = '400 Bad Request' + _msg = 'The Content-MD5 you specified did not match what we received.' + + +class XAmzContentSHA256Mismatch(ErrorResponse): + _status = '400 Bad Request' + _msg = "The provided 'x-amz-content-sha256' header does not match what " \ + "was computed." + + +class BucketAlreadyExists(ErrorResponse): + _status = '409 Conflict' + _msg = 'The requested bucket name is not available. The bucket ' \ + 'namespace is shared by all users of the system. Please select a ' \ + 'different name and try again.' + + def __init__(self, bucket, msg=None, *args, **kwargs): + ErrorResponse.__init__(self, msg, bucket_name=bucket, *args, **kwargs) + + +class BucketAlreadyOwnedByYou(ErrorResponse): + _status = '409 Conflict' + _msg = 'Your previous request to create the named bucket succeeded and ' \ + 'you already own it.' + + def __init__(self, bucket, msg=None, *args, **kwargs): + ErrorResponse.__init__(self, msg, bucket_name=bucket, *args, **kwargs) + + +class BucketNotEmpty(ErrorResponse): + _status = '409 Conflict' + _msg = 'The bucket you tried to delete is not empty' + + +class VersionedBucketNotEmpty(BucketNotEmpty): + _msg = 'The bucket you tried to delete is not empty. ' \ + 'You must delete all versions in the bucket.' + _code = 'BucketNotEmpty' + + +class CredentialsNotSupported(ErrorResponse): + _status = '400 Bad Request' + _msg = 'This request does not support credentials.' + + +class CrossLocationLoggingProhibited(ErrorResponse): + _status = '403 Forbidden' + _msg = 'Cross location logging not allowed. Buckets in one geographic ' \ + 'location cannot log information to a bucket in another location.' + + +class EntityTooSmall(ErrorResponse): + _status = '400 Bad Request' + _msg = 'Your proposed upload is smaller than the minimum allowed object ' \ + 'size.' + + +class EntityTooLarge(ErrorResponse): + _status = '400 Bad Request' + _msg = 'Your proposed upload exceeds the maximum allowed object size.' + + +class ExpiredToken(ErrorResponse): + _status = '400 Bad Request' + _msg = 'The provided token has expired.' + + +class IllegalVersioningConfigurationException(ErrorResponse): + _status = '400 Bad Request' + _msg = 'The Versioning configuration specified in the request is invalid.' + + +class IncompleteBody(ErrorResponse): + _status = '400 Bad Request' + _msg = 'You did not provide the number of bytes specified by the ' \ + 'Content-Length HTTP header' + + +class IncorrectNumberOfFilesInPostRequest(ErrorResponse): + _status = '400 Bad Request' + _msg = 'POST requires exactly one file upload per request.' + + +class InlineDataTooLarge(ErrorResponse): + _status = '400 Bad Request' + _msg = 'Inline data exceeds the maximum allowed size.' + + +class InternalError(ErrorResponse): + _status = '500 Internal Server Error' + _msg = 'We encountered an internal error. Please try again.' + + def __str__(self): + return '%s: %s (%s)' % ( + self.__class__.__name__, self.status, self._msg) + + +class InvalidAccessKeyId(ErrorResponse): + _status = '403 Forbidden' + _msg = 'The AWS Access Key Id you provided does not exist in our records.' + + +class InvalidArgument(ErrorResponse): + _status = '400 Bad Request' + _msg = 'Invalid Argument.' 
+ + def __init__(self, name, value, msg=None, *args, **kwargs): + ErrorResponse.__init__(self, msg, argument_name=name, + argument_value=value, *args, **kwargs) + + +class InvalidBucketName(ErrorResponse): + _status = '400 Bad Request' + _msg = 'The specified bucket is not valid.' + + def __init__(self, bucket, msg=None, *args, **kwargs): + ErrorResponse.__init__(self, msg, bucket_name=bucket, *args, **kwargs) + + +class InvalidBucketState(ErrorResponse): + _status = '409 Conflict' + _msg = 'The request is not valid with the current state of the bucket.' + + +class InvalidChunkSizeError(ErrorResponse): + _status = '403 Forbidden' + _msg = 'Only the last chunk is allowed to have a size less than 8192 bytes' + + +class InvalidDigest(ErrorResponse): + _status = '400 Bad Request' + _msg = 'The Content-MD5 you specified was invalid.' + + +class InvalidLocationConstraint(ErrorResponse): + _status = '400 Bad Request' + _msg = 'The specified location constraint is not valid.' + + +class InvalidObjectState(ErrorResponse): + _status = '403 Forbidden' + _msg = 'The operation is not valid for the current state of the object.' + + +class InvalidPartArgument(InvalidArgument): + _code = 'InvalidArgument' + + def __init__(self, max_parts, value): + err_msg = ('Part number must be an integer between ' + '1 and %s, inclusive' % max_parts) + super(InvalidArgument, self).__init__(err_msg, + argument_name='partNumber', + argument_value=value) + + +class InvalidPart(ErrorResponse): + _status = '400 Bad Request' + _msg = 'One or more of the specified parts could not be found. The ' \ + 'part may not have been uploaded, or the specified entity tag ' \ + 'may not match the part\'s entity tag.' + + +class InvalidPartOrder(ErrorResponse): + _status = '400 Bad Request' + _msg = 'The list of parts was not in ascending order.Parts list must ' \ + 'specified in order by part number.' + + +class InvalidPayer(ErrorResponse): + _status = '403 Forbidden' + _msg = 'All access to this object has been disabled.' + + +class InvalidPolicyDocument(ErrorResponse): + _status = '400 Bad Request' + _msg = 'The content of the form does not meet the conditions specified ' \ + 'in the policy document.' + + +class InvalidRange(ErrorResponse): + _status = '416 Requested Range Not Satisfiable' + _msg = 'The requested range cannot be satisfied.' + + +class InvalidPartNumber(ErrorResponse): + _status = '416 Requested Range Not Satisfiable' + _msg = 'The requested partnumber is not satisfiable' + + +class InvalidRequest(ErrorResponse): + _status = '400 Bad Request' + _msg = 'Invalid Request.' + + +class InvalidSecurity(ErrorResponse): + _status = '403 Forbidden' + _msg = 'The provided security credentials are not valid.' + + +class InvalidSOAPRequest(ErrorResponse): + _status = '400 Bad Request' + _msg = 'The SOAP request body is invalid.' + + +class InvalidStorageClass(ErrorResponse): + _status = '400 Bad Request' + _msg = 'The storage class you specified is not valid.' + + +class InvalidTargetBucketForLogging(ErrorResponse): + _status = '400 Bad Request' + _msg = 'The target bucket for logging does not exist, is not owned by ' \ + 'you, or does not have the appropriate grants for the ' \ + 'log-delivery group.' + + def __init__(self, bucket, msg=None, *args, **kwargs): + ErrorResponse.__init__(self, msg, target_bucket=bucket, *args, + **kwargs) + + +class InvalidToken(ErrorResponse): + _status = '400 Bad Request' + _msg = 'The provided token is malformed or otherwise invalid.' 
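# A hand-written sketch of how the constructor arguments on these error
# classes surface in the response body: extra keyword arguments are kept in
# self.info and rendered by _dict_to_etree(), which camel-cases snake_case
# keys into element tags. Element order and whitespace below are
# illustrative only:
#
#   InvalidArgument('partNumber', 'abc') is expected to serialize roughly as
#
#   <Error>
#     <Code>InvalidArgument</Code>
#     <Message>Invalid Argument.</Message>
#     <ArgumentName>partNumber</ArgumentName>
#     <ArgumentValue>abc</ArgumentValue>
#   </Error>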
+ + +class InvalidURI(ErrorResponse): + _status = '400 Bad Request' + _msg = 'Couldn\'t parse the specified URI.' + + def __init__(self, uri, msg=None, *args, **kwargs): + ErrorResponse.__init__(self, msg, uri=uri, *args, **kwargs) + + +class KeyTooLongError(ErrorResponse): + _status = '400 Bad Request' + _msg = 'Your key is too long.' + + +class MalformedACLError(ErrorResponse): + _status = '400 Bad Request' + _msg = 'The XML you provided was not well-formed or did not validate ' \ + 'against our published schema.' + + +class MalformedPOSTRequest(ErrorResponse): + _status = '400 Bad Request' + _msg = 'The body of your POST request is not well-formed ' \ + 'multipart/form-data.' + + +class MalformedTrailerError(ErrorResponse): + _status = '400 Bad Request' + _msg = 'The request contained trailing data that was not well-formed ' \ + 'or did not conform to our published schema.' + + +class MalformedXML(ErrorResponse): + _status = '400 Bad Request' + _msg = 'The XML you provided was not well-formed or did not validate ' \ + 'against our published schema' + + +class MaxMessageLengthExceeded(ErrorResponse): + _status = '400 Bad Request' + _msg = 'Your request was too big.' + + +class MaxPostPreDataLengthExceededError(ErrorResponse): + _status = '400 Bad Request' + _msg = 'Your POST request fields preceding the upload file were too large.' + + +class MetadataTooLarge(ErrorResponse): + _status = '400 Bad Request' + _msg = 'Your metadata headers exceed the maximum allowed metadata size.' + + +class MethodNotAllowed(ErrorResponse): + _status = '405 Method Not Allowed' + _msg = 'The specified method is not allowed against this resource.' + + def __init__(self, method, resource_type, msg=None, *args, **kwargs): + ErrorResponse.__init__(self, msg, method=method, + resource_type=resource_type, *args, **kwargs) + + +class MissingContentLength(ErrorResponse): + _status = '411 Length Required' + _msg = 'You must provide the Content-Length HTTP header.' + + +class MissingRequestBodyError(ErrorResponse): + _status = '400 Bad Request' + _msg = 'Request body is empty.' + + +class MissingSecurityElement(ErrorResponse): + _status = '400 Bad Request' + _msg = 'The SOAP 1.1 request is missing a security element.' + + +class MissingSecurityHeader(ErrorResponse): + _status = '400 Bad Request' + _msg = 'Your request was missing a required header.' + + +class NoLoggingStatusForKey(ErrorResponse): + _status = '400 Bad Request' + _msg = 'There is no such thing as a logging status sub-resource for a key.' + + +class NoSuchBucket(ErrorResponse): + _status = '404 Not Found' + _msg = 'The specified bucket does not exist.' + + def __init__(self, bucket, msg=None, *args, **kwargs): + if not bucket: + raise InternalError() + ErrorResponse.__init__(self, msg, bucket_name=bucket, *args, **kwargs) + + +class NoSuchKey(ErrorResponse): + _status = '404 Not Found' + _msg = 'The specified key does not exist.' + + def __init__(self, key, msg=None, *args, **kwargs): + if not key: + raise InternalError() + ErrorResponse.__init__(self, msg, key=key, *args, **kwargs) + + +class ObjectLockConfigurationNotFoundError(ErrorResponse): + _status = '404 Not found' + _msg = 'Object Lock configuration does not exist for this bucket' + + def __init__(self, bucket, msg=None, *args, **kwargs): + if not bucket: + raise InternalError() + ErrorResponse.__init__(self, msg, bucket_name=bucket, *args, **kwargs) + + +class NoSuchLifecycleConfiguration(ErrorResponse): + _status = '404 Not Found' + _msg = 'The lifecycle configuration does not exist. .' 
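# Note on the 404 classes above: NoSuchBucket, NoSuchKey and
# ObjectLockConfigurationNotFoundError all require a non-empty resource
# name; a falsy value is treated as a programming error and raises
# InternalError rather than building a client-facing 404. For example:
#
#   >>> NoSuchKey('missing-object').status
#   '404 Not Found'
#   >>> NoSuchKey(None)   # no key name: InternalError is raised instead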
+ + +class NoSuchUpload(ErrorResponse): + _status = '404 Not Found' + _msg = 'The specified multipart upload does not exist. The upload ID ' \ + 'might be invalid, or the multipart upload might have been ' \ + 'aborted or completed.' + + +class NoSuchVersion(ErrorResponse): + _status = '404 Not Found' + _msg = 'The specified version does not exist.' + + def __init__(self, key, version_id, msg=None, *args, **kwargs): + if not key: + raise InternalError() + ErrorResponse.__init__(self, msg, key=key, version_id=version_id, + *args, **kwargs) + + +# NotImplemented is a python built-in constant. Use S3NotImplemented instead. +class S3NotImplemented(ErrorResponse): + _status = '501 Not Implemented' + _msg = 'Not implemented.' + _code = 'NotImplemented' + + +class NotSignedUp(ErrorResponse): + _status = '403 Forbidden' + _msg = 'Your account is not signed up for the Amazon S3 service.' + + +class NotSuchBucketPolicy(ErrorResponse): + _status = '404 Not Found' + _msg = 'The specified bucket does not have a bucket policy.' + + +class OperationAborted(ErrorResponse): + _status = '409 Conflict' + _msg = 'A conflicting conditional operation is currently in progress ' \ + 'against this resource. Please try again.' + + +class PermanentRedirect(ErrorResponse): + _status = '301 Moved Permanently' + _msg = 'The bucket you are attempting to access must be addressed using ' \ + 'the specified endpoint. Please send all future requests to this ' \ + 'endpoint.' + + +class PreconditionFailed(ErrorResponse): + _status = '412 Precondition Failed' + _msg = 'At least one of the preconditions you specified did not hold.' + + +class Redirect(ErrorResponse): + _status = '307 Moved Temporarily' + _msg = 'Temporary redirect.' + + +class RestoreAlreadyInProgress(ErrorResponse): + _status = '409 Conflict' + _msg = 'Object restore is already in progress.' + + +class RequestIsNotMultiPartContent(ErrorResponse): + _status = '400 Bad Request' + _msg = 'Bucket POST must be of the enclosure-type multipart/form-data.' + + +class RequestTimeout(ErrorResponse): + _status = '400 Bad Request' + _msg = 'Your socket connection to the server was not read from or ' \ + 'written to within the timeout period.' + + +class RequestTimeTooSkewed(ErrorResponse): + _status = '403 Forbidden' + _msg = 'The difference between the request time and the current time ' \ + 'is too large.' + + +class RequestTorrentOfBucketError(ErrorResponse): + _status = '400 Bad Request' + _msg = 'Requesting the torrent file of a bucket is not permitted.' + + +class SignatureDoesNotMatch(ErrorResponse): + _status = '403 Forbidden' + _msg = 'The request signature we calculated does not match the ' \ + 'signature you provided. Check your key and signing method.' + + +class ServiceUnavailable(ErrorResponse): + _status = '503 Service Unavailable' + _msg = 'Please reduce your request rate.' + + +class SlowDown(ErrorResponse): + _status = '503 Slow Down' + _msg = 'Please reduce your request rate.' + + +class TemporaryRedirect(ErrorResponse): + _status = '307 Moved Temporarily' + _msg = 'You are being redirected to the bucket while DNS updates.' + + +class TokenRefreshRequired(ErrorResponse): + _status = '400 Bad Request' + _msg = 'The provided token must be refreshed.' + + +class TooManyBuckets(ErrorResponse): + _status = '400 Bad Request' + _msg = 'You have attempted to create more buckets than allowed.' + + +class UnexpectedContent(ErrorResponse): + _status = '400 Bad Request' + _msg = 'This request does not support content.' 
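# The wire-level <Code> defaults to the Python class name (see
# ErrorResponse.__init__), so classes whose name cannot match the S3 error
# code override _code explicitly. A small sanity check, derived by hand:
#
#   >>> S3NotImplemented()._code
#   'NotImplemented'
#   >>> VersionedBucketNotEmpty()._code
#   'BucketNotEmpty'
#   >>> TooManyBuckets()._code
#   'TooManyBuckets'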
+ + +class UnresolvableGrantByEmailAddress(ErrorResponse): + _status = '400 Bad Request' + _msg = 'The e-mail address you provided does not match any account on ' \ + 'record.' + + +class UserKeyMustBeSpecified(ErrorResponse): + _status = '400 Bad Request' + _msg = 'The bucket POST must contain the specified field name. If it is ' \ + 'specified, please check the order of the fields.' + + +class BrokenMPU(ErrorResponse): + # This is very much a Swift-ism, and we wish we didn't need it + _status = '409 Conflict' + _msg = 'Multipart upload has broken segment data.' diff --git a/swift/common/middleware/s3api/s3token.py b/swift/common/middleware/s3api/s3token.py new file mode 100644 index 0000000000..41f87cb375 --- /dev/null +++ b/swift/common/middleware/s3api/s3token.py @@ -0,0 +1,438 @@ +# Copyright 2012 OpenStack Foundation +# Copyright 2010 United States Government as represented by the +# Administrator of the National Aeronautics and Space Administration. +# Copyright 2011,2012 Akira YOSHIYAMA +# All Rights Reserved. +# +# Licensed under the Apache License, Version 2.0 (the "License"); you may +# not use this file except in compliance with the License. You may obtain +# a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT +# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the +# License for the specific language governing permissions and limitations +# under the License. + +# This source code is based ./auth_token.py and ./ec2_token.py. +# See them for their copyright. + +""" +------------------- +S3 Token Middleware +------------------- +s3token middleware is for authentication with s3api + keystone. +This middleware: + +* Gets a request from the s3api middleware with an S3 Authorization + access key. +* Validates s3 token with Keystone. +* Transforms the account name to AUTH_%(tenant_name). +* Optionally can retrieve and cache secret from keystone + to validate signature locally + +.. note:: + If upgrading from swift3, the ``auth_version`` config option has been + removed, and the ``auth_uri`` option now includes the Keystone API + version. If you previously had a configuration like + + .. code-block:: ini + + [filter:s3token] + use = egg:swift3#s3token + auth_uri = https://keystonehost:35357 + auth_version = 3 + + you should now use + + .. 
code-block:: ini + + [filter:s3token] + use = egg:swift#s3token + auth_uri = https://keystonehost:35357/v3 +""" + +import base64 +import json + +from keystoneclient.v3 import client as keystone_client +from keystoneauth1 import session as keystone_session +from keystoneauth1 import loading as keystone_loading +import requests +import urllib + +from swift.common.swob import Request, HTTPBadRequest, HTTPUnauthorized, \ + HTTPException, str_to_wsgi +from swift.common.utils import config_true_value, split_path, get_logger, \ + cache_from_env, append_underscore +from swift.common.wsgi import ConfigFileError + + +PROTOCOL_NAME = 'S3 Token Authentication' + +# Headers to purge if they came from (or may have come from) the client +KEYSTONE_AUTH_HEADERS = ( + 'X-Identity-Status', 'X-Service-Identity-Status', + 'X-Domain-Id', 'X-Service-Domain-Id', + 'X-Domain-Name', 'X-Service-Domain-Name', + 'X-Project-Id', 'X-Service-Project-Id', + 'X-Project-Name', 'X-Service-Project-Name', + 'X-Project-Domain-Id', 'X-Service-Project-Domain-Id', + 'X-Project-Domain-Name', 'X-Service-Project-Domain-Name', + 'X-User-Id', 'X-Service-User-Id', + 'X-User-Name', 'X-Service-User-Name', + 'X-User-Domain-Id', 'X-Service-User-Domain-Id', + 'X-User-Domain-Name', 'X-Service-User-Domain-Name', + 'X-Roles', 'X-Service-Roles', + 'X-Is-Admin-Project', + 'X-Service-Catalog', + # Deprecated headers, too... + 'X-Tenant-Id', + 'X-Tenant-Name', + 'X-Tenant', + 'X-User', + 'X-Role', +) + + +def parse_v2_response(token): + access_info = token['access'] + headers = { + 'X-Identity-Status': 'Confirmed', + 'X-Roles': ','.join(r['name'] + for r in access_info['user']['roles']), + 'X-User-Id': access_info['user']['id'], + 'X-User-Name': access_info['user']['name'], + 'X-Tenant-Id': access_info['token']['tenant']['id'], + 'X-Tenant-Name': access_info['token']['tenant']['name'], + 'X-Project-Id': access_info['token']['tenant']['id'], + 'X-Project-Name': access_info['token']['tenant']['name'], + } + return headers, access_info['token']['tenant'] + + +def parse_v3_response(token): + token = token['token'] + headers = { + 'X-Identity-Status': 'Confirmed', + 'X-Roles': ','.join(r['name'] + for r in token['roles']), + 'X-User-Id': token['user']['id'], + 'X-User-Name': token['user']['name'], + 'X-User-Domain-Id': token['user']['domain']['id'], + 'X-User-Domain-Name': token['user']['domain']['name'], + 'X-Tenant-Id': token['project']['id'], + 'X-Tenant-Name': token['project']['name'], + 'X-Project-Id': token['project']['id'], + 'X-Project-Name': token['project']['name'], + 'X-Project-Domain-Id': token['project']['domain']['id'], + 'X-Project-Domain-Name': token['project']['domain']['name'], + } + return headers, token['project'] + + +class S3Token(object): + """Middleware that handles S3 authentication.""" + + def __init__(self, app, conf): + """Common initialization code.""" + self._app = app + self._logger = get_logger( + conf, log_route=conf.get('log_name', 's3token')) + self._logger.debug('Starting the %s component', PROTOCOL_NAME) + self._timeout = float(conf.get('http_timeout', '10.0')) + if not (0 < self._timeout <= 60): + raise ValueError('http_timeout must be between 0 and 60 seconds') + self._reseller_prefix = append_underscore( + conf.get('reseller_prefix', 'AUTH')) + self._delay_auth_decision = config_true_value( + conf.get('delay_auth_decision')) + + # where to find the auth service (we use this to validate tokens) + self._request_uri = conf.get('auth_uri', '').rstrip('/') + '/s3tokens' + parsed = 
urllib.parse.urlsplit(self._request_uri) + if not parsed.scheme or not parsed.hostname: + raise ConfigFileError( + 'Invalid auth_uri; must include scheme and host') + if parsed.scheme not in ('http', 'https'): + raise ConfigFileError( + 'Invalid auth_uri; scheme must be http or https') + if parsed.query or parsed.fragment or '@' in parsed.netloc: + raise ConfigFileError('Invalid auth_uri; must not include ' + 'username, query, or fragment') + + # SSL + insecure = config_true_value(conf.get('insecure')) + cert_file = conf.get('certfile') + key_file = conf.get('keyfile') + + if insecure: + self._verify = False + elif cert_file and key_file: + self._verify = (cert_file, key_file) + elif cert_file: + self._verify = cert_file + else: + self._verify = None + + self._secret_cache_duration = int( + conf.get('secret_cache_duration', 60)) + if self._secret_cache_duration < 0: + raise ValueError('secret_cache_duration must be non-negative') + + # Service authentication for s3tokens API calls + self.keystoneclient = None + try: + auth_plugin = keystone_loading.get_plugin_loader( + conf.get('auth_type', 'password')) + available_auth_options = auth_plugin.get_options() + auth_options = {} + for option in available_auth_options: + name = option.name.replace('-', '_') + value = conf.get(name) + if value: + auth_options[name] = value + + if not auth_options: + self._logger.warning( + "No service auth configuration. " + "s3tokens API calls will be unauthenticated. " + "New versions of keystone require service auth.") + else: + auth = auth_plugin.load_from_options(**auth_options) + session = keystone_session.Session(auth=auth) + self.keystoneclient = keystone_client.Client( + session=session, + region_name=conf.get('region_name')) + self._logger.info( + "Service authentication configured for s3tokens API") + except Exception: + self._logger.warning( + "Unable to load service auth configuration. " + "s3tokens API calls will be unauthenticated " + "and secret caching will be unavailable.", + exc_info=True) + + if self._secret_cache_duration and self.keystoneclient: + self._logger.info("Caching s3tokens for %s seconds", + self._secret_cache_duration) + else: + self._secret_cache_duration = 0 + + def _deny_request(self, code): + error_cls, message = { + 'AccessDenied': (HTTPUnauthorized, 'Access denied'), + 'InvalidURI': (HTTPBadRequest, + 'Could not parse the specified URI'), + }[code] + resp = error_cls(content_type='text/xml') + error_msg = ('\r\n' + '\r\n %s\r\n ' + '%s\r\n\r\n' % + (code, message)).encode() + resp.body = error_msg + return resp + + def _json_request(self, creds_json): + headers = {'Content-Type': 'application/json'} + + # Add service authentication headers if configured + if self.keystoneclient: + try: + headers.update( + self.keystoneclient.session.get_auth_headers()) + except Exception: + self._logger.warning("Failed to get service token", + exc_info=True) + + try: + response = requests.post(self._request_uri, + headers=headers, data=creds_json, + verify=self._verify, + timeout=self._timeout) + except requests.exceptions.RequestException as e: + self._logger.info('HTTP connection exception: %s', e) + raise self._deny_request('InvalidURI') + + if response.status_code < 200 or response.status_code >= 300: + self._logger.debug('Keystone reply error: status=%s reason=%s', + response.status_code, response.reason) + raise self._deny_request('AccessDenied') + + return response + + def __call__(self, environ, start_response): + """Handle incoming request. 
authenticate and send downstream.""" + req = Request(environ) + self._logger.debug('Calling S3Token middleware.') + + # Always drop auth headers if we're first in the pipeline + if 'keystone.token_info' not in req.environ: + req.headers.update({h: None for h in KEYSTONE_AUTH_HEADERS}) + + try: + parts = split_path(urllib.parse.unquote(req.path), 1, 4, True) + version, account, container, obj = parts + except ValueError: + msg = 'Not a path query: %s, skipping.' % req.path + self._logger.debug(msg) + return self._app(environ, start_response) + + # Read request signature and access id. + s3_auth_details = req.environ.get('s3api.auth_details') + if not s3_auth_details: + msg = 'No authorization details from s3api. skipping.' + self._logger.debug(msg) + return self._app(environ, start_response) + + access = s3_auth_details['access_key'] + if isinstance(access, bytes): + access = access.decode('utf-8') + + signature = s3_auth_details['signature'] + if isinstance(signature, bytes): + signature = signature.decode('utf-8') + + string_to_sign = s3_auth_details['string_to_sign'] + if isinstance(string_to_sign, str): + string_to_sign = string_to_sign.encode('utf-8') + token = base64.urlsafe_b64encode(string_to_sign) + if isinstance(token, bytes): + token = token.decode('ascii') + + # NOTE(chmou): This is to handle the special case with nova + # when we have the option s3_affix_tenant. We will force it to + # connect to another account than the one + # authenticated. Before people start getting worried about + # security, I should point that we are connecting with + # username/token specified by the user but instead of + # connecting to its own account we will force it to go to an + # another account. In a normal scenario if that user don't + # have the reseller right it will just fail but since the + # reseller account can connect to every account it is allowed + # by the swift_auth middleware. + force_tenant = None + if ':' in access: + access, force_tenant = access.split(':') + + # Authenticate request. + creds = {'credentials': {'access': access, + 'token': token, + 'signature': signature}} + + memcache_client = None + memcache_token_key = 's3secret/%s' % access + if self._secret_cache_duration > 0: + memcache_client = cache_from_env(environ) + cached_auth_data = None + + if memcache_client: + cached_auth_data = memcache_client.get(memcache_token_key) + if cached_auth_data: + if len(cached_auth_data) == 4: + # Old versions of swift may have cached token, too, + # but we don't need it + headers, _token, tenant, secret = cached_auth_data + else: + headers, tenant, secret = cached_auth_data + + if s3_auth_details['check_signature'](secret): + self._logger.debug("Cached creds valid") + else: + self._logger.debug("Cached creds invalid") + cached_auth_data = None + + if not cached_auth_data: + creds_json = json.dumps(creds) + self._logger.debug('Connecting to Keystone sending this JSON: %s', + creds_json) + # NOTE(vish): We could save a call to keystone by having + # keystone return token, tenant, user, and roles + # from this call. + # + # NOTE(chmou): We still have the same problem we would need to + # change token_auth to detect if we already + # identified and not doing a second query and just + # pass it through to swiftauth in this case. 
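        # For illustration only, the credentials document POSTed to
        # Keystone's /s3tokens endpoint below has roughly this shape
        # (all values invented):
        #
        #   {"credentials": {"access": "052d5160a5...",
        #                    "token": "<base64 of the string to sign>",
        #                    "signature": "eEm9cuFG2..."}}
        #
        # Keystone is expected to recompute the signature from the stored
        # EC2 secret and, on a match, return the token and project data
        # that parse_v2_response()/parse_v3_response() handle.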
+ try: + # NB: requests.Response, not swob.Response + resp = self._json_request(creds_json) + except HTTPException as e_resp: + if self._delay_auth_decision: + msg = ('Received error, deferring rejection based on ' + 'error: %s') + self._logger.debug(msg, e_resp.status) + return self._app(environ, start_response) + else: + msg = 'Received error, rejecting request with error: %s' + self._logger.debug(msg, e_resp.status) + # NB: swob.Response, not requests.Response + return e_resp(environ, start_response) + + self._logger.debug('Keystone Reply: Status: %d, Output: %s', + resp.status_code, resp.content) + + try: + token = resp.json() + if 'access' in token: + headers, tenant = parse_v2_response(token) + elif 'token' in token: + headers, tenant = parse_v3_response(token) + else: + raise ValueError + if memcache_client: + user_id = headers.get('X-User-Id') + if not user_id: + raise ValueError + try: + cred_ref = self.keystoneclient.ec2.get( + user_id=user_id, + access=access) + memcache_client.set( + memcache_token_key, + (headers, tenant, cred_ref.secret), + time=self._secret_cache_duration) + self._logger.debug("Cached keystone credentials") + except Exception: + self._logger.warning("Unable to cache secret", + exc_info=True) + + # Populate the environment similar to auth_token, + # so we don't have to contact Keystone again. + # + # Note that although the strings are unicode following json + # deserialization, Swift's HeaderEnvironProxy handles ensuring + # they're stored as native strings + req.environ['keystone.token_info'] = token + except (ValueError, KeyError, TypeError): + if self._delay_auth_decision: + error = ('Error on keystone reply: %d %s - ' + 'deferring rejection downstream') + self._logger.debug(error, resp.status_code, resp.content) + return self._app(environ, start_response) + else: + error = ('Error on keystone reply: %d %s - ' + 'rejecting request') + self._logger.debug(error, resp.status_code, resp.content) + return self._deny_request('InvalidURI')( + environ, start_response) + + req.headers.update(headers) + tenant_to_connect = force_tenant or tenant['id'] + self._logger.debug('Connecting with tenant: %s', tenant_to_connect) + new_tenant_name = '%s%s' % (self._reseller_prefix, tenant_to_connect) + environ['PATH_INFO'] = environ['PATH_INFO'].replace( + str_to_wsgi(account), str_to_wsgi(new_tenant_name), 1) + return self._app(environ, start_response) + + +def filter_factory(global_conf, **local_conf): + """Returns a WSGI filter app for use with paste.deploy.""" + conf = global_conf.copy() + conf.update(local_conf) + + def auth_filter(app): + return S3Token(app, conf) + return auth_filter diff --git a/swift/common/middleware/s3api/schema/access_control_policy.rng b/swift/common/middleware/s3api/schema/access_control_policy.rng new file mode 100644 index 0000000000..5308a12f32 --- /dev/null +++ b/swift/common/middleware/s3api/schema/access_control_policy.rng @@ -0,0 +1,16 @@ + + + + + + + + + + + + + + + + diff --git a/swift/common/middleware/s3api/schema/bucket_logging_status.rng b/swift/common/middleware/s3api/schema/bucket_logging_status.rng new file mode 100644 index 0000000000..27ea1e1dd0 --- /dev/null +++ b/swift/common/middleware/s3api/schema/bucket_logging_status.rng @@ -0,0 +1,25 @@ + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/swift/common/middleware/s3api/schema/common.rng b/swift/common/middleware/s3api/schema/common.rng new file mode 100644 index 0000000000..22319c0ebd --- /dev/null +++ b/swift/common/middleware/s3api/schema/common.rng @@ -0,0 
+1,66 @@ + + + + + + + + + + + + + + + + + STANDARD + REDUCED_REDUNDANCY + GLACIER + UNKNOWN + + + + + + + + + + + AmazonCustomerByEmail + + + + + + + + CanonicalUser + + + + + + Group + + + + + + + + + + READ + WRITE + READ_ACP + WRITE_ACP + FULL_CONTROL + + + + + + + diff --git a/swift/common/middleware/s3api/schema/complete_multipart_upload.rng b/swift/common/middleware/s3api/schema/complete_multipart_upload.rng new file mode 100644 index 0000000000..55aefa464e --- /dev/null +++ b/swift/common/middleware/s3api/schema/complete_multipart_upload.rng @@ -0,0 +1,44 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/swift/common/middleware/s3api/schema/complete_multipart_upload_result.rng b/swift/common/middleware/s3api/schema/complete_multipart_upload_result.rng new file mode 100644 index 0000000000..47406e1c5e --- /dev/null +++ b/swift/common/middleware/s3api/schema/complete_multipart_upload_result.rng @@ -0,0 +1,19 @@ + + + + + + + + + + + + + + + + + + + diff --git a/swift/common/middleware/s3api/schema/copy_object_result.rng b/swift/common/middleware/s3api/schema/copy_object_result.rng new file mode 100644 index 0000000000..ec0ac95f2c --- /dev/null +++ b/swift/common/middleware/s3api/schema/copy_object_result.rng @@ -0,0 +1,13 @@ + + + + + + + + + + + + + diff --git a/swift/common/middleware/s3api/schema/copy_part_result.rng b/swift/common/middleware/s3api/schema/copy_part_result.rng new file mode 100644 index 0000000000..0370daad6b --- /dev/null +++ b/swift/common/middleware/s3api/schema/copy_part_result.rng @@ -0,0 +1,13 @@ + + + + + + + + + + + + + diff --git a/swift/common/middleware/s3api/schema/create_bucket_configuration.rng b/swift/common/middleware/s3api/schema/create_bucket_configuration.rng new file mode 100644 index 0000000000..882edc465f --- /dev/null +++ b/swift/common/middleware/s3api/schema/create_bucket_configuration.rng @@ -0,0 +1,11 @@ + + + + + + + + + + + diff --git a/swift/common/middleware/s3api/schema/delete.rng b/swift/common/middleware/s3api/schema/delete.rng new file mode 100644 index 0000000000..f0659fc1c0 --- /dev/null +++ b/swift/common/middleware/s3api/schema/delete.rng @@ -0,0 +1,28 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/swift/common/middleware/s3api/schema/delete_result.rng b/swift/common/middleware/s3api/schema/delete_result.rng new file mode 100644 index 0000000000..1e28b3ceb8 --- /dev/null +++ b/swift/common/middleware/s3api/schema/delete_result.rng @@ -0,0 +1,47 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/swift/common/middleware/s3api/schema/error.rng b/swift/common/middleware/s3api/schema/error.rng new file mode 100644 index 0000000000..a0d61d4853 --- /dev/null +++ b/swift/common/middleware/s3api/schema/error.rng @@ -0,0 +1,30 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/swift/common/middleware/s3api/schema/initiate_multipart_upload_result.rng b/swift/common/middleware/s3api/schema/initiate_multipart_upload_result.rng new file mode 100644 index 0000000000..67d03016da --- /dev/null +++ b/swift/common/middleware/s3api/schema/initiate_multipart_upload_result.rng @@ -0,0 +1,16 @@ + + + + + + + + + + + + + + + + diff --git a/swift/common/middleware/s3api/schema/lifecycle_configuration.rng b/swift/common/middleware/s3api/schema/lifecycle_configuration.rng new file mode 100644 index 0000000000..dd0816e2f5 --- /dev/null +++ 
b/swift/common/middleware/s3api/schema/lifecycle_configuration.rng @@ -0,0 +1,56 @@ + + + + + + + + + + + + + + + + + + + Enabled + Disabled + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/swift/common/middleware/s3api/schema/list_all_my_buckets_result.rng b/swift/common/middleware/s3api/schema/list_all_my_buckets_result.rng new file mode 100644 index 0000000000..76959d7b81 --- /dev/null +++ b/swift/common/middleware/s3api/schema/list_all_my_buckets_result.rng @@ -0,0 +1,23 @@ + + + + + + + + + + + + + + + + + + + + + + + diff --git a/swift/common/middleware/s3api/schema/list_bucket_result.rng b/swift/common/middleware/s3api/schema/list_bucket_result.rng new file mode 100644 index 0000000000..b3181238e6 --- /dev/null +++ b/swift/common/middleware/s3api/schema/list_bucket_result.rng @@ -0,0 +1,93 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/swift/common/middleware/s3api/schema/list_multipart_uploads_result.rng b/swift/common/middleware/s3api/schema/list_multipart_uploads_result.rng new file mode 100644 index 0000000000..2e20c840ec --- /dev/null +++ b/swift/common/middleware/s3api/schema/list_multipart_uploads_result.rng @@ -0,0 +1,73 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/swift/common/middleware/s3api/schema/list_parts_result.rng b/swift/common/middleware/s3api/schema/list_parts_result.rng new file mode 100644 index 0000000000..4cf5a0ce7d --- /dev/null +++ b/swift/common/middleware/s3api/schema/list_parts_result.rng @@ -0,0 +1,59 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/swift/common/middleware/s3api/schema/list_versions_result.rng b/swift/common/middleware/s3api/schema/list_versions_result.rng new file mode 100644 index 0000000000..464cfbcc48 --- /dev/null +++ b/swift/common/middleware/s3api/schema/list_versions_result.rng @@ -0,0 +1,104 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/swift/common/middleware/s3api/schema/location_constraint.rng b/swift/common/middleware/s3api/schema/location_constraint.rng new file mode 100644 index 0000000000..2f3a143b27 --- /dev/null +++ b/swift/common/middleware/s3api/schema/location_constraint.rng @@ -0,0 +1,8 @@ + + + + + + + + diff --git a/swift/common/middleware/s3api/schema/versioning_configuration.rng b/swift/common/middleware/s3api/schema/versioning_configuration.rng new file mode 100644 index 0000000000..3d6d3d1238 --- /dev/null +++ b/swift/common/middleware/s3api/schema/versioning_configuration.rng @@ -0,0 +1,25 @@ + + + + + + + + + Enabled + Suspended + + + + + + + Enabled + Disabled + + + + + + + diff --git a/swift/common/middleware/s3api/subresource.py b/swift/common/middleware/s3api/subresource.py new file mode 100644 index 0000000000..42af24bd05 --- /dev/null +++ b/swift/common/middleware/s3api/subresource.py @@ -0,0 +1,574 @@ +# Copyright (c) 2014 OpenStack Foundation. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. 
+# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. +""" +--------------------------- +s3api's ACLs implementation +--------------------------- +s3api uses a different implementation approach to achieve S3 ACLs. + +First, we should understand what we have to design to achieve real S3 ACLs. +Current s3api(real S3)'s ACLs Model is as follows:: + + AccessControlPolicy: + Owner: + AccessControlList: + Grant[n]: + (Grantee, Permission) + +Each bucket or object has its own acl consisting of Owner and +AcessControlList. AccessControlList can contain some Grants. +By default, AccessControlList has only one Grant to allow FULL +CONTROLL to owner. Each Grant includes single pair with Grantee, +Permission. Grantee is the user (or user group) allowed the given permission. + +This module defines the groups and the relation tree. + +If you wanna get more information about S3's ACLs model in detail, +please see official documentation here, + +http://docs.aws.amazon.com/AmazonS3/latest/dev/acl-overview.html + +""" +from functools import partial + +from swift.common.utils import json + +from swift.common.middleware.s3api.s3response import InvalidArgument, \ + MalformedACLError, S3NotImplemented, InvalidRequest, AccessDenied +from swift.common.middleware.s3api.etree import Element, SubElement, tostring +from swift.common.middleware.s3api.utils import sysmeta_header +from swift.common.middleware.s3api.exception import InvalidSubresource + +XMLNS_XSI = 'http://www.w3.org/2001/XMLSchema-instance' +PERMISSIONS = ['FULL_CONTROL', 'READ', 'WRITE', 'READ_ACP', 'WRITE_ACP'] +LOG_DELIVERY_USER = '.log_delivery' + + +def encode_acl(resource, acl): + """ + Encode an ACL instance to Swift metadata. + + Given a resource type and an ACL instance, this method returns HTTP + headers, which can be used for Swift metadata. + """ + header_value = {"Owner": acl.owner.id} + grants = [] + for grant in acl.grants: + grant = {"Permission": grant.permission, + "Grantee": str(grant.grantee)} + grants.append(grant) + header_value.update({"Grant": grants}) + headers = {} + key = sysmeta_header(resource, 'acl') + headers[key] = json.dumps(header_value, separators=(',', ':')) + + return headers + + +def decode_acl(resource, headers, allow_no_owner): + """ + Decode Swift metadata to an ACL instance. + + Given a resource type and HTTP headers, this method returns an ACL + instance. + """ + value = '' + + key = sysmeta_header(resource, 'acl') + if key in headers: + value = headers[key] + + if value == '': + # Fix me: In the case of value is empty or not dict instance, + # I want an instance of Owner as None. + # However, in the above process would occur error in reference + # to an instance variable of Owner. 
+ return ACL(Owner(None, None), [], True, allow_no_owner) + + try: + encode_value = json.loads(value) + if not isinstance(encode_value, dict): + return ACL(Owner(None, None), [], True, allow_no_owner) + + id = None + name = None + grants = [] + if 'Owner' in encode_value: + id = encode_value['Owner'] + name = encode_value['Owner'] + if 'Grant' in encode_value: + for grant in encode_value['Grant']: + grantee = None + # pylint: disable-msg=E1101 + for group in Group.__subclasses__(): + if group.__name__ == grant['Grantee']: + grantee = group() + if not grantee: + grantee = User(grant['Grantee']) + permission = grant['Permission'] + grants.append(Grant(grantee, permission)) + return ACL(Owner(id, name), grants, True, allow_no_owner) + except Exception as e: + raise InvalidSubresource((resource, 'acl', value), e) + + +class Grantee(object): + """ + Base class for grantee. + + Methods: + + * init: create a Grantee instance + * elem: create an ElementTree from itself + + Static Methods: + + * from_header: convert a grantee string in the HTTP header + to an Grantee instance. + * from_elem: convert a ElementTree to an Grantee instance. + + """ + # Needs confirmation whether we really need these methods or not. + # * encode (method): create a JSON which includes whole own elements + # * encode_from_elem (static method): convert from an ElementTree to a JSON + # * elem_from_json (static method): convert from a JSON to an ElementTree + # * from_json (static method): convert a Json string to an Grantee + # instance. + + def __contains__(self, key): + """ + The key argument is a S3 user id. This method checks that the user id + belongs to this class. + """ + raise S3NotImplemented() + + def elem(self): + """ + Get an etree element of this instance. + """ + raise S3NotImplemented() + + @staticmethod + def from_elem(elem): + type = elem.get('{%s}type' % XMLNS_XSI) + if type == 'CanonicalUser': + value = elem.find('./ID').text + return User(value) + elif type == 'Group': + value = elem.find('./URI').text + subclass = get_group_subclass_from_uri(value) + return subclass() + elif type == 'AmazonCustomerByEmail': + raise S3NotImplemented() + else: + raise MalformedACLError() + + @staticmethod + def from_header(grantee): + """ + Convert a grantee string in the HTTP header to an Grantee instance. + """ + grantee_type, value = grantee.split('=', 1) + grantee_type = grantee_type.lower() + value = value.strip('"\'') + if grantee_type == 'id': + return User(value) + elif grantee_type == 'emailaddress': + raise S3NotImplemented() + elif grantee_type == 'uri': + # return a subclass instance of Group class + subclass = get_group_subclass_from_uri(value) + return subclass() + else: + raise InvalidArgument(grantee_type, value, + 'Argument format not recognized') + + +class User(Grantee): + """ + Canonical user class for S3 accounts. 
+ """ + type = 'CanonicalUser' + + def __init__(self, name): + self.id = name + self.display_name = name + + def __contains__(self, key): + return key == self.id + + def elem(self): + elem = Element('Grantee', nsmap={'xsi': XMLNS_XSI}) + elem.set('{%s}type' % XMLNS_XSI, self.type) + SubElement(elem, 'ID').text = self.id + SubElement(elem, 'DisplayName').text = self.display_name + return elem + + def __str__(self): + return self.display_name + + def __lt__(self, other): + if not isinstance(other, User): + return NotImplemented + return self.id < other.id + + +class Owner(object): + """ + Owner class for S3 accounts + """ + def __init__(self, id, name): + self.id = id + if not (name is None or isinstance(name, str)): + raise TypeError('name must be a string or None') + self.name = name + + +def get_group_subclass_from_uri(uri): + """ + Convert a URI to one of the predefined groups. + """ + for group in Group.__subclasses__(): # pylint: disable-msg=E1101 + if group.uri == uri: + return group + raise InvalidArgument('uri', uri, 'Invalid group uri') + + +class Group(Grantee): + """ + Base class for Amazon S3 Predefined Groups + """ + type = 'Group' + uri = '' + + def __init__(self): + # Initialize method to clarify this has nothing to do + pass + + def elem(self): + elem = Element('Grantee', nsmap={'xsi': XMLNS_XSI}) + elem.set('{%s}type' % XMLNS_XSI, self.type) + SubElement(elem, 'URI').text = self.uri + + return elem + + def __str__(self): + return self.__class__.__name__ + + +def canned_acl_grantees(bucket_owner, object_owner=None): + """ + A set of predefined grants supported by AWS S3. + """ + owner = object_owner or bucket_owner + + return { + 'private': [ + ('FULL_CONTROL', User(owner.name)), + ], + 'public-read': [ + ('READ', AllUsers()), + ('FULL_CONTROL', User(owner.name)), + ], + 'public-read-write': [ + ('READ', AllUsers()), + ('WRITE', AllUsers()), + ('FULL_CONTROL', User(owner.name)), + ], + 'authenticated-read': [ + ('READ', AuthenticatedUsers()), + ('FULL_CONTROL', User(owner.name)), + ], + 'bucket-owner-read': [ + ('READ', User(bucket_owner.name)), + ('FULL_CONTROL', User(owner.name)), + ], + 'bucket-owner-full-control': [ + ('FULL_CONTROL', User(owner.name)), + ('FULL_CONTROL', User(bucket_owner.name)), + ], + 'log-delivery-write': [ + ('WRITE', LogDelivery()), + ('READ_ACP', LogDelivery()), + ('FULL_CONTROL', User(owner.name)), + ], + } + + +class AuthenticatedUsers(Group): + """ + This group represents all AWS accounts. Access permission to this group + allows any AWS account to access the resource. However, all requests must + be signed (authenticated). + """ + uri = 'http://acs.amazonaws.com/groups/global/AuthenticatedUsers' + + def __contains__(self, key): + # s3api handles only signed requests. + return True + + +class AllUsers(Group): + """ + Access permission to this group allows anyone to access the resource. The + requests can be signed (authenticated) or unsigned (anonymous). Unsigned + requests omit the Authentication header in the request. + + Note: s3api regards unsigned requests as Swift API accesses, and bypasses + them to Swift. As a result, AllUsers behaves completely same as + AuthenticatedUsers. + """ + uri = 'http://acs.amazonaws.com/groups/global/AllUsers' + + def __contains__(self, key): + return True + + +class LogDelivery(Group): + """ + WRITE and READ_ACP permissions on a bucket enables this group to write + server access logs to the bucket. 
+ """ + uri = 'http://acs.amazonaws.com/groups/s3/LogDelivery' + + def __contains__(self, key): + if ':' in key: + tenant, user = key.split(':', 1) + else: + user = key + return user == LOG_DELIVERY_USER + + +class Grant(object): + """ + Grant Class which includes both Grantee and Permission + """ + + def __init__(self, grantee, permission): + """ + :param grantee: a grantee class or its subclass + :param permission: string + """ + if permission.upper() not in PERMISSIONS: + raise S3NotImplemented() + if not isinstance(grantee, Grantee): + raise ValueError() + self.grantee = grantee + self.permission = permission + + @classmethod + def from_elem(cls, elem): + """ + Convert an ElementTree to an ACL instance + """ + grantee = Grantee.from_elem(elem.find('./Grantee')) + permission = elem.find('./Permission').text + return cls(grantee, permission) + + def elem(self): + """ + Create an etree element. + """ + elem = Element('Grant') + elem.append(self.grantee.elem()) + SubElement(elem, 'Permission').text = self.permission + + return elem + + def allow(self, grantee, permission): + return permission == self.permission and grantee in self.grantee + + +class ACL(object): + """ + S3 ACL class. + + Refs (S3 API - acl-overview: + http://docs.aws.amazon.com/AmazonS3/latest/dev/acl-overview.html): + + The sample ACL includes an Owner element identifying the owner via the + AWS account's canonical user ID. The Grant element identifies the grantee + (either an AWS account or a predefined group), and the permission granted. + This default ACL has one Grant element for the owner. You grant permissions + by adding Grant elements, each grant identifying the grantee and the + permission. + """ + metadata_name = 'acl' + root_tag = 'AccessControlPolicy' + max_xml_length = 200 * 1024 + + def __init__(self, owner, grants=None, s3_acl=False, allow_no_owner=False): + """ + :param owner: Owner instance for ACL instance + :param grants: a list of Grant instances + :param s3_acl: boolean indicates whether this class is used under + s3_acl is True or False (from s3api middleware configuration) + :param allow_no_owner: boolean indicates this ACL instance can be + handled when no owner information found + """ + self.owner = owner + self.grants = grants or [] + self.s3_acl = s3_acl + self.allow_no_owner = allow_no_owner + + def __bytes__(self): + return tostring(self.elem()) + + def __repr__(self): + return self.__bytes__().decode('utf8') + + @classmethod + def from_elem(cls, elem, s3_acl=False, allow_no_owner=False): + """ + Convert an ElementTree to an ACL instance + """ + id = elem.find('./Owner/ID').text + try: + name = elem.find('./Owner/DisplayName').text + except AttributeError: + name = id + + grants = [Grant.from_elem(e) + for e in elem.findall('./AccessControlList/Grant')] + return cls(Owner(id, name), grants, s3_acl, allow_no_owner) + + def elem(self): + """ + Decode the value to an ACL instance. + """ + elem = Element(self.root_tag) + + owner = SubElement(elem, 'Owner') + SubElement(owner, 'ID').text = self.owner.id + SubElement(owner, 'DisplayName').text = self.owner.name + + SubElement(elem, 'AccessControlList').extend( + g.elem() for g in self.grants + ) + + return elem + + def check_owner(self, user_id): + """ + Check that the user is an owner. + """ + if not self.s3_acl: + # Ignore S3api ACL. + return + + if not self.owner.id: + if self.allow_no_owner: + # No owner means public. 
+ return + raise AccessDenied() + + if user_id != self.owner.id: + raise AccessDenied() + + def check_permission(self, user_id, permission): + """ + Check that the user has a permission. + """ + if not self.s3_acl: + # Ignore S3api ACL. + return + + try: + # owners have full control permission + self.check_owner(user_id) + return + except AccessDenied: + pass + + if permission in PERMISSIONS: + for g in self.grants: + if g.allow(user_id, 'FULL_CONTROL') or \ + g.allow(user_id, permission): + return + + raise AccessDenied() + + @classmethod + def from_headers(cls, headers, bucket_owner, object_owner=None, + as_private=True): + """ + Convert HTTP headers to an ACL instance. + """ + grants = [] + try: + for key, value in headers.items(): + if key.lower().startswith('x-amz-grant-'): + permission = key[len('x-amz-grant-'):] + permission = permission.upper().replace('-', '_') + if permission not in PERMISSIONS: + continue + for grantee in value.split(','): + grants.append( + Grant(Grantee.from_header(grantee), permission)) + + if 'x-amz-acl' in headers: + try: + acl = headers['x-amz-acl'] + if len(grants) > 0: + err_msg = 'Specifying both Canned ACLs and Header ' \ + 'Grants is not allowed' + raise InvalidRequest(err_msg) + grantees = canned_acl_grantees( + bucket_owner, object_owner)[acl] + for permission, grantee in grantees: + grants.append(Grant(grantee, permission)) + except KeyError: + # expects canned_acl_grantees()[] raises KeyError + raise InvalidArgument('x-amz-acl', headers['x-amz-acl']) + except (KeyError, ValueError): + # TODO: think about we really catch this except sequence + raise InvalidRequest() + + if len(grants) == 0: + # No ACL headers + if as_private: + return ACLPrivate(bucket_owner, object_owner) + else: + return None + + return cls(object_owner or bucket_owner, grants) + + +class CannedACL(object): + """ + A dict-like object that returns canned ACL. + """ + def __getitem__(self, key): + def acl(key, bucket_owner, object_owner=None, + s3_acl=False, allow_no_owner=False): + grants = [] + grantees = canned_acl_grantees(bucket_owner, object_owner)[key] + for permission, grantee in grantees: + grants.append(Grant(grantee, permission)) + return ACL(object_owner or bucket_owner, + grants, s3_acl, allow_no_owner) + + return partial(acl, key) + + +canned_acl = CannedACL() + +ACLPrivate = canned_acl['private'] +ACLPublicRead = canned_acl['public-read'] +ACLPublicReadWrite = canned_acl['public-read-write'] +ACLAuthenticatedRead = canned_acl['authenticated-read'] +ACLBucketOwnerRead = canned_acl['bucket-owner-read'] +ACLBucketOwnerFullControl = canned_acl['bucket-owner-full-control'] +ACLLogDeliveryWrite = canned_acl['log-delivery-write'] diff --git a/swift/common/middleware/s3api/utils.py b/swift/common/middleware/s3api/utils.py new file mode 100644 index 0000000000..dc956a189b --- /dev/null +++ b/swift/common/middleware/s3api/utils.py @@ -0,0 +1,372 @@ +# Copyright (c) 2014 OpenStack Foundation. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
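# Looking back at subresource.py above, a sketch of how a canned ACL is
# persisted as Swift system metadata via encode_acl(); the account name
# 'test:tester' is invented for illustration and the output is wrapped
# here for readability:
#
#   >>> acl = ACLPrivate(Owner('test:tester', 'test:tester'))
#   >>> encode_acl('container', acl)
#   {'x-container-sysmeta-s3api-acl':
#    '{"Owner":"test:tester","Grant":[{"Permission":"FULL_CONTROL",
#      "Grantee":"test:tester"}]}'}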
+ +import base64 +import calendar +import datetime +import email.utils +import re +import time +import uuid + +from swift.common import utils +from swift.common.constraints import check_utf8 +from swift.common.swob import wsgi_to_str +from swift.common.middleware.s3api.exception import \ + InvalidBucketNameParseError, InvalidURIParseError + +MULTIUPLOAD_SUFFIX = '+segments' + + +def sysmeta_prefix(resource): + """ + Returns the system metadata prefix for given resource type. + """ + if resource.lower() == 'object': + return 'x-object-sysmeta-s3api-' + else: + return 'x-container-sysmeta-s3api-' + + +def sysmeta_header(resource, name): + """ + Returns the system metadata header for given resource type and name. + """ + return sysmeta_prefix(resource) + name + + +def camel_to_snake(camel): + return re.sub('(.)([A-Z])', r'\1_\2', camel).lower() + + +def snake_to_camel(snake): + return snake.title().replace('_', '') + + +def make_header_label(header): + return 'header_' + header.lower().replace('-', '_') + + +def unique_id(): + result = base64.urlsafe_b64encode(str(uuid.uuid4()).encode('ascii')) + return result.decode('ascii') + + +def utf8encode(s): + if s is None or isinstance(s, bytes): + return s + return s.encode('utf8') + + +def utf8decode(s): + if isinstance(s, bytes): + s = s.decode('utf8') + return s + + +def is_valid_base64(s): + try: + base64.b64decode(s) + return True + except Exception: + return False + + +def is_valid_hash(hash_string): + try: + int(hash_string, 16) + except ValueError: + return False + return True + + +def classify_checksum_header_value(value): + if is_valid_hash(value): + if len(value) in (8, 16, 20, 32, 64, 128, 256, 512): + return 'hash_%d' % len(value) + elif is_valid_base64(value): + # crc32 -> b64_8 + # crc64 -> b64_12 + # md5 -> b64_24 + # sha1 -> b64_28 + # sha256 -> b64_44 + if len(value) in (8, 12, 24, 28, 44): + return 'b64_%d' % len(value) + return 'unknown' + + +def validate_bucket_name(name, dns_compliant_bucket_names): + """ + Validates the name of the bucket against S3 criteria, + http://docs.amazonwebservices.com/AmazonS3/latest/BucketRestrictions.html + True is valid, False is invalid. + """ + valid_chars = '-.a-z0-9' + if not dns_compliant_bucket_names: + valid_chars += 'A-Z_' + max_len = 63 if dns_compliant_bucket_names else 255 + + if len(name) < 3 or len(name) > max_len or not name[0].isalnum(): + # Bucket names should be between 3 and 63 (or 255) characters long + # Bucket names must start with a letter or a number + return False + elif dns_compliant_bucket_names and ( + '.-' in name or '-.' in name or '..' in name or + not name[-1].isalnum()): + # Bucket names cannot contain dashes next to periods + # Bucket names cannot contain two adjacent periods + # Bucket names must end with a letter or a number + return False + elif name.endswith('.'): + # Bucket names must not end with dot + return False + elif re.match(r"^(([0-9]|[1-9][0-9]|1[0-9]{2}|2[0-4][0-9]|25[0-5])\.)" + r"{3}([0-9]|[1-9][0-9]|1[0-9]{2}|2[0-4][0-9]|25[0-5])$", + name): + # Bucket names cannot be formatted as an IP Address + return False + elif not re.match("^[%s]*$" % valid_chars, name): + # Bucket names can contain lowercase letters, numbers, and hyphens. + return False + else: + return True + + +def get_s3_access_key_id(req): + """ + Return the S3 access_key_id user for the request, + or None if it does not look like an S3 request. 
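+
+    The key is taken from a v2 ``Authorization: AWS <key>:<signature>``
+    header, a v4 ``Authorization: AWS4-HMAC-SHA256 Credential=<key>/...``
+    header, or the equivalent ``AWSAccessKeyId`` / ``X-Amz-Credential``
+    query parameters, in that order.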
+ + :param req: a swob.Request instance + + :returns: access_key_id if available, else None + """ + + authorization = req.headers.get('Authorization', '') + if authorization.startswith('AWS '): + # v2 + return authorization[4:].rsplit(':', 1)[0] + if authorization.startswith('AWS4-HMAC-SHA256 '): + # v4 + return authorization.partition('Credential=')[2].split('/', 1)[0] + params = req.params + if 'AWSAccessKeyId' in params: + # v2 + return params['AWSAccessKeyId'] + if 'X-Amz-Credential' in params: + # v4 + return params['X-Amz-Credential'].split('/', 1)[0] + + return None + + +def is_s3_req(req): + """ + Check whether a request looks like it ought to be an S3 request. + + :param req: a swob.Request instance + + :returns: True if access_key_id is available, False if not + """ + return bool(get_s3_access_key_id(req)) + + +def parse_host(environ, storage_domains): + """ + A bucket-in-host request has the bucket name as the first part of a + ``.``-separated host. If the host ends with any of + the given storage_domains then the bucket name is returned. + Otherwise ``None`` is returned. + + :param environ: an environment dict + :param storage_domains: a list of storage domains for which bucket-in-host + is supported. + :returns: bucket name or None + """ + + if 'HTTP_HOST' in environ: + given_domain = environ['HTTP_HOST'] + elif 'SERVER_NAME' in environ: + given_domain = environ['SERVER_NAME'] + else: + return None + if ':' in given_domain: + given_domain = given_domain.rsplit(':', 1)[0] + + for storage_domain in storage_domains: + if not storage_domain.startswith('.'): + storage_domain = '.' + storage_domain + + if given_domain.endswith(storage_domain): + return given_domain[:-len(storage_domain)] + + return None + + +def parse_path(req, bucket_in_host, dns_compliant_bucket_names): + """ + :params req: a swob.Request instance + :params bucket_in_host: A bucket-in-host request has the bucket name as + the first part of a ``.``-separated host. + :params dns_compliant_bucket_names: whether to validate that the bucket + name must be dns compliant + + :returns: WSGI string + """ + if not check_utf8(wsgi_to_str(req.environ['PATH_INFO'])): + raise InvalidURIParseError(req.path) + + if bucket_in_host: + obj = req.environ['PATH_INFO'][1:] or None + return bucket_in_host, obj + + bucket, obj = req.split_path(0, 2, True) + + if bucket and not validate_bucket_name( + bucket, dns_compliant_bucket_names): + # Ignore GET service case + raise InvalidBucketNameParseError(bucket) + return bucket, obj + + +def extract_bucket_and_key(req, storage_domains, + dns_compliant_bucket_names): + """ + Extract the bucket and object key from the request's PATH_INFO. Support + bucket-in-host if storage_domains and HTTP_HOST or SERVER_NAME are + specified. Otherwise the bucket is parsed from PATH_INFO. + + :param req: a swob.Request instance + :param storage_domains: a list of storage domains for which bucket-in-host + is supported. + :param dns_compliant_bucket_names: whether to validate that the bucket + name must be dns compliant + + :returns: a tuple of (bucket, key). If the request path is invalid + the tuple (None, None) is returned. 
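+
+    For example, a path-style request for ``/bucket/key`` and a
+    virtual-hosted request to ``bucket.<storage_domain>`` with path ``/key``
+    both yield ``('bucket', 'key')``.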
+ """ + try: + bucket_in_host = parse_host(req.environ, storage_domains) + bucket, key = parse_path( + req, bucket_in_host, dns_compliant_bucket_names) + except (InvalidBucketNameParseError, InvalidURIParseError): + bucket, key = None, None + return bucket, key + + +class S3Timestamp(utils.Timestamp): + S3_XML_FORMAT = "%Y-%m-%dT%H:%M:%S.000Z" + + @property + def s3xmlformat(self): + dt = datetime.datetime.fromtimestamp( + self.ceil(), datetime.timezone.utc) + return dt.strftime(self.S3_XML_FORMAT) + + @classmethod + def from_s3xmlformat(cls, date_string): + dt = datetime.datetime.strptime(date_string, cls.S3_XML_FORMAT) + dt = dt.replace(tzinfo=datetime.timezone.utc) + seconds = calendar.timegm(dt.timetuple()) + return cls(seconds) + + @property + def amz_date_format(self): + """ + this format should be like 'YYYYMMDDThhmmssZ' + """ + return self.isoformat.replace( + '-', '').replace(':', '')[:-7] + 'Z' + + +def mktime(timestamp_str, time_format='%Y-%m-%dT%H:%M:%S'): + """ + mktime creates a float instance in epoch time really like as time.mktime + + the difference from time.mktime is allowing to 2 formats string for the + argument for the S3 testing usage. + TODO: support + + :param timestamp_str: a string of timestamp formatted as + (a) RFC2822 (e.g. date header) + (b) %Y-%m-%dT%H:%M:%S (e.g. copy result) + :param time_format: a string of format to parse in (b) process + :returns: a float instance in epoch time + """ + # time_tuple is the *remote* local time + time_tuple = email.utils.parsedate_tz(timestamp_str) + if time_tuple is None: + time_tuple = time.strptime(timestamp_str, time_format) + # add timezone info as utc (no time difference) + time_tuple += (0, ) + + # We prefer calendar.gmtime and a manual adjustment over + # email.utils.mktime_tz because older versions of Python (<2.7.4) may + # double-adjust for timezone in some situations (such when swift changes + # os.environ['TZ'] without calling time.tzset()). 
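+    # time_tuple[9] is the UTC offset in seconds parsed from the timestamp
+    # (forced to 0 by the strptime branch above), so subtracting it turns
+    # the remote local time into a UTC epoch value.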
+ epoch_time = calendar.timegm(time_tuple) - time_tuple[9] + + return epoch_time + + +class Config(dict): + DEFAULTS = { + 'storage_domains': [], + 'location': 'us-east-1', + 'force_swift_request_proxy_log': False, + 'dns_compliant_bucket_names': True, + 'allow_multipart_uploads': True, + 'allow_no_owner': False, + 'allowable_clock_skew': 900, + 'ratelimit_as_client_error': False, + 'max_upload_part_num': 1000, + } + + def __init__(self, base=None): + self.update(self.DEFAULTS) + if base is not None: + self.update(base) + + def __getattr__(self, name): + if name not in self: + raise AttributeError("No attribute '%s'" % name) + + return self[name] + + def __setattr__(self, name, value): + self[name] = value + + def __delattr__(self, name): + del self[name] + + def update(self, other): + if hasattr(other, 'keys'): + for key in other.keys(): + self[key] = other[key] + else: + for key, value in other: + self[key] = value + + def __setitem__(self, key, value): + if isinstance(self.get(key), bool): + dict.__setitem__(self, key, utils.config_true_value(value)) + elif isinstance(self.get(key), int): + try: + dict.__setitem__(self, key, int(value)) + except ValueError: + if value: # No need to raise the error if value is '' + raise + else: + dict.__setitem__(self, key, value) diff --git a/swift/common/middleware/slo.py b/swift/common/middleware/slo.py new file mode 100644 index 0000000000..6a62166ce6 --- /dev/null +++ b/swift/common/middleware/slo.py @@ -0,0 +1,1919 @@ +# Copyright (c) 2018 OpenStack Foundation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +r""" +Middleware that will provide Static Large Object (SLO) support. + +This feature is very similar to Dynamic Large Object (DLO) support in that +it allows the user to upload many objects concurrently and afterwards +download them as a single object. It is different in that it does not rely +on eventually consistent container listings to do so. Instead, a user +defined manifest of the object segments is used. + +---------------------- +Uploading the Manifest +---------------------- + +After the user has uploaded the objects to be concatenated, a manifest is +uploaded. The request must be a ``PUT`` with the query parameter:: + + ?multipart-manifest=put + +The body of this request will be an ordered list of segment descriptions in +JSON format. The data to be supplied for each segment is either: + +=========== ======================================================== +Key Description +=========== ======================================================== +path the path to the segment object (not including account) + /container/object_name +etag (optional) the ETag given back when the segment object + was PUT +size_bytes (optional) the size of the complete segment object in + bytes +range (optional) the (inclusive) range within the object to + use as a segment. 
If omitted, the entire object is used +=========== ======================================================== + +Or: + +=========== ======================================================== +Key Description +=========== ======================================================== +data base64-encoded data to be returned +=========== ======================================================== + +.. note:: + At least one object-backed segment must be included. If you'd like + to create a manifest consisting purely of data segments, consider + uploading a normal object instead. + +The format of the list will be:: + + [{"path": "/cont/object", + "etag": "etagoftheobjectsegment", + "size_bytes": 10485760, + "range": "1048576-2097151"}, + {"data": base64.b64encode("interstitial data")}, + {"path": "/cont/another-object", ...}, + ...] + +The number of object-backed segments is limited to ``max_manifest_segments`` +(configurable in proxy-server.conf, default 1000). Each segment must be at +least 1 byte. On upload, the middleware will head every object-backed segment +passed in to verify: + +1. the segment exists (i.e. the ``HEAD`` was successful); +2. the segment meets minimum size requirements; +3. if the user provided a non-null ``etag``, the etag matches; +4. if the user provided a non-null ``size_bytes``, the size_bytes matches; and +5. if the user provided a ``range``, it is a singular, syntactically correct + range that is satisfiable given the size of the object referenced. + +For inlined data segments, the middleware verifies each is valid, non-empty +base64-encoded binary data. Note that data segments *do not* count against +``max_manifest_segments``. + +Note that the ``etag`` and ``size_bytes`` keys are optional; if omitted, the +verification is not performed. If any of the objects fail to verify (not +found, size/etag mismatch, below minimum size, invalid range) then the user +will receive a 4xx error response. If everything does match, the user will +receive a 2xx response and the SLO object is ready for downloading. + +Note that large manifests may take a long time to verify; historically, +clients would need to use a long read timeout for the connection to give +Swift enough time to send a final ``201 Created`` or ``400 Bad Request`` +response. Now, clients should use the query parameters:: + + ?multipart-manifest=put&heartbeat=on + +to request that Swift send an immediate ``202 Accepted`` response and periodic +whitespace to keep the connection alive. A final response code will appear in +the body. The format of the response body defaults to text/plain but can be +either json or xml depending on the ``Accept`` header. An example body is as +follows:: + + Response Status: 201 Created + Response Body: + Etag: "8f481cede6d2ddc07cb36aa084d9a64d" + Last Modified: Wed, 25 Oct 2017 17:08:55 GMT + Errors: + +Or, as a json response:: + + {"Response Status": "201 Created", + "Response Body": "", + "Etag": "\"8f481cede6d2ddc07cb36aa084d9a64d\"", + "Last Modified": "Wed, 25 Oct 2017 17:08:55 GMT", + "Errors": []} + +Behind the scenes, on success, a JSON manifest generated from the user input is +sent to object servers with an extra ``X-Static-Large-Object: True`` header +and a modified ``Content-Type``. The items in this manifest will include the +``etag`` and ``size_bytes`` for each segment, regardless of whether the client +specified them for verification. 
The parameter ``swift_bytes=$total_size`` will +be appended to the existing ``Content-Type``, where ``$total_size`` is the sum +of all the included segments' ``size_bytes``. This extra parameter will be +hidden from the user. + +Manifest files can reference objects in separate containers, which will improve +concurrent upload speed. Objects can be referenced by multiple manifests. The +segments of a SLO manifest can even be other SLO manifests. Treat them as any +other object i.e., use the ``Etag`` and ``Content-Length`` given on the ``PUT`` +of the sub-SLO in the manifest to the parent SLO. + +While uploading a manifest, a user can send ``Etag`` for verification. It needs +to be md5 of the segments' etags, if there is no range specified. For example, +if the manifest to be uploaded looks like this:: + + [{"path": "/cont/object1", + "etag": "etagoftheobjectsegment1", + "size_bytes": 10485760}, + {"path": "/cont/object2", + "etag": "etagoftheobjectsegment2", + "size_bytes": 10485760}] + +The Etag of the above manifest would be md5 of ``etagoftheobjectsegment1`` and +``etagoftheobjectsegment2``. This could be computed in the following way:: + + echo -n 'etagoftheobjectsegment1etagoftheobjectsegment2' | md5sum + +If a manifest to be uploaded with a segment range looks like this:: + + [{"path": "/cont/object1", + "etag": "etagoftheobjectsegmentone", + "size_bytes": 10485760, + "range": "1-2"}, + {"path": "/cont/object2", + "etag": "etagoftheobjectsegmenttwo", + "size_bytes": 10485760, + "range": "3-4"}] + +While computing the Etag of the above manifest, internally each segment's etag +will be taken in the form of ``etagvalue:rangevalue;``. Hence the Etag of the +above manifest would be:: + + echo -n 'etagoftheobjectsegmentone:1-2;etagoftheobjectsegmenttwo:3-4;' \ + | md5sum + +For the purposes of Etag computations, inlined data segments are considered to +have an etag of the md5 of the raw data (i.e., *not* base64-encoded). + + +------------------- +Range Specification +------------------- + +Users now have the ability to specify ranges for SLO segments. +Users can include an optional ``range`` field in segment descriptions +to specify which bytes from the underlying object should be used for the +segment data. Only one range may be specified per segment. + +.. note:: + + The ``etag`` and ``size_bytes`` fields still describe the backing object + as a whole. + +If a user uploads this manifest:: + + [{"path": "/con/obj_seg_1", "size_bytes": 2097152, "range": "0-1048576"}, + {"path": "/con/obj_seg_2", "size_bytes": 2097152, + "range": "512-1550000"}, + {"path": "/con/obj_seg_1", "size_bytes": 2097152, "range": "-2048"}] + +The segment will consist of the first 1048576 bytes of /con/obj_seg_1, +followed by bytes 513 through 1550000 (inclusive) of /con/obj_seg_2, and +finally bytes 2095104 through 2097152 (i.e., the last 2048 bytes) of +/con/obj_seg_1. + +.. note:: + + The minimum sized range is 1 byte. This is the same as the minimum + segment size. + + +------------------------- +Inline Data Specification +------------------------- + +When uploading a manifest, users can include 'data' segments that should +be included along with objects. The data in these segments must be +base64-encoded binary data and will be included in the etag of the +resulting large object exactly as if that data had been uploaded and +referenced as separate objects. + +.. 
note:: + + This feature is primarily aimed at reducing the need for storing + many tiny objects, and as such any supplied data must fit within + the maximum manifest size (default is 8MiB). This maximum size + can be configured via ``max_manifest_size`` in proxy-server.conf. + + +------------------------- +Retrieving a Large Object +------------------------- + +A ``GET`` request to the manifest object will return the concatenation of the +objects from the manifest much like DLO. If any of the segments from the +manifest are not found or their ``Etag``/``Content-Length`` have changed since +upload, the connection will drop. In this case a ``409 Conflict`` will be +logged in the proxy logs and the user will receive incomplete results. Note +that this will be enforced regardless of whether the user performed per-segment +validation during upload. + +The headers from this ``GET`` or ``HEAD`` request will return the metadata +attached to the manifest object itself with some exceptions: + +===================== ================================================== +Header Value +===================== ================================================== +Content-Length the total size of the SLO (the sum of the sizes of + the segments in the manifest) +X-Static-Large-Object the string "True" +Etag the etag of the SLO (generated the same way as DLO) +===================== ================================================== + +A ``GET`` request with the query parameter:: + + ?multipart-manifest=get + +will return a transformed version of the original manifest, containing +additional fields and different key names. For example, the first manifest in +the example above would look like this:: + + [{"name": "/cont/object", + "hash": "etagoftheobjectsegment", + "bytes": 10485760, + "range": "1048576-2097151"}, ...] + +As you can see, some of the fields are renamed compared to the put request: +*path* is *name*, *etag* is *hash*, *size_bytes* is *bytes*. The *range* field +remains the same (if present). + +A GET request with the query parameters:: + + ?multipart-manifest=get&format=raw + +will return the contents of the original manifest as it was sent by the client. +The main purpose for both calls is solely debugging. + +A GET request to a manifest object with the query parameter:: + + ?part-number= + +will return the contents of the ``nth`` segment. Segments are indexed from 1, +so ``n`` must be an integer between 1 and the total number of segments in the +manifest. The response status will be ``206 Partial Content`` and its headers +will include: an ``X-Parts-Count`` header equal to the total number of +segments; a ``Content-Length`` header equal to the length of the specified +segment; a ``Content-Range`` header describing the byte range of the specified +part within the SLO. A HEAD request with a ``part-number`` parameter will also +return a response with status ``206 Partial Content`` and the same headers. + +.. note:: + + When the manifest object is uploaded you are more or less guaranteed that + every segment in the manifest exists and matched the specifications. + However, there is nothing that prevents the user from breaking the SLO + download by deleting/replacing a segment referenced in the manifest. It is + left to the user to use caution in handling the segments. + + +----------------------- +Deleting a Large Object +----------------------- + +A ``DELETE`` request will just delete the manifest object itself. The segment +data referenced by the manifest will remain unchanged. 
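+
+For illustration only (hypothetical storage URL, account and token), such a
+plain delete of the manifest could be issued as::
+
+    # illustrative values; substitute your own storage URL and token
+    curl -X DELETE -H "X-Auth-Token: $TOKEN" \
+        https://swift.example.com/v1/AUTH_test/cont/manifest-object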
+ +A ``DELETE`` with a query parameter:: + + ?multipart-manifest=delete + +will delete all the segments referenced in the manifest and then the manifest +itself. The failure response will be similar to the bulk delete middleware. + +A ``DELETE`` with the query parameters:: + + ?multipart-manifest=delete&async=yes + +will schedule all the segments referenced in the manifest to be deleted +asynchronously and then delete the manifest itself. Note that segments will +continue to appear in listings and be counted for quotas until they are +cleaned up by the object-expirer. This option is only available when all +segments are in the same container and none of them are nested SLOs. + +------------------------ +Modifying a Large Object +------------------------ + +``PUT`` and ``POST`` requests will work as expected; ``PUT``\s will just +overwrite the manifest object for example. + +------------------ +Container Listings +------------------ + +In a container listing the size listed for SLO manifest objects will be the +``total_size`` of the concatenated segments in the manifest. The overall +``X-Container-Bytes-Used`` for the container (and subsequently for the account) +will not reflect ``total_size`` of the manifest but the actual size of the JSON +data stored. The reason for this somewhat confusing discrepancy is we want the +container listing to reflect the size of the manifest object when it is +downloaded. We do not, however, want to count the bytes-used twice (for both +the manifest and the segments it's referring to) in the container and account +metadata which can be used for stats and billing purposes. +""" + +import base64 +from collections import defaultdict +from datetime import datetime +import json +import mimetypes +import re +import time + +from swift.cli.container_deleter import make_delete_jobs +from swift.common.header_key_dict import HeaderKeyDict +from swift.common.exceptions import ListingIterError, SegmentError +from swift.common.middleware.listing_formats import \ + MAX_CONTAINER_LISTING_CONTENT_LENGTH +from swift.common.swob import Request, HTTPBadRequest, HTTPServerError, \ + HTTPMethodNotAllowed, HTTPRequestEntityTooLarge, HTTPLengthRequired, \ + HTTPOk, HTTPPreconditionFailed, HTTPException, HTTPNotFound, \ + HTTPUnauthorized, HTTPConflict, HTTPUnprocessableEntity, \ + HTTPServiceUnavailable, Response, Range, normalize_etag, \ + RESPONSE_REASONS, str_to_wsgi, bytes_to_wsgi, wsgi_to_str, wsgi_quote +from swift.common.utils import get_logger, config_true_value, \ + override_bytes_from_content_type, split_path, \ + RateLimitedIterator, quote, closing_if_possible, \ + LRUCache, StreamingPile, strict_b64decode, Timestamp, friendly_close, \ + md5, parse_header +from swift.common.registry import register_swift_info +from swift.common.request_helpers import SegmentedIterable, \ + get_sys_meta_prefix, update_etag_is_at_header, resolve_etag_is_at_header, \ + get_container_update_override_key, update_ignore_range_header, \ + get_param, get_valid_part_num, get_heartbeat_response_body +from swift.common.constraints import check_utf8 +from swift.common.http import HTTP_NOT_FOUND, HTTP_UNAUTHORIZED +from swift.common.wsgi import WSGIContext, make_subrequest, make_env, \ + make_pre_authed_request +from swift.common.middleware.bulk import ACCEPTABLE_FORMATS, Bulk +from swift.obj import expirer +from swift.proxy.controllers.base import get_container_info + + +DEFAULT_RATE_LIMIT_UNDER_SIZE = 1024 ** 2 # 1 MiB +DEFAULT_MAX_MANIFEST_SEGMENTS = 1000 +DEFAULT_MAX_MANIFEST_SIZE = 8 * (1024 ** 
2) # 8 MiB +DEFAULT_YIELD_FREQUENCY = 10 + + +SLO_KEYS = { + # required: optional + 'data': set(), + 'path': {'range', 'etag', 'size_bytes'}, +} + +SYSMETA_SLO_ETAG = get_sys_meta_prefix('object') + 'slo-etag' +SYSMETA_SLO_SIZE = get_sys_meta_prefix('object') + 'slo-size' + + +def parse_and_validate_input(req_body, req_path): + """ + Given a request body, parses it and returns a list of dictionaries. + + The output structure is nearly the same as the input structure, but it + is not an exact copy. Given a valid object-backed input dictionary + ``d_in``, its corresponding output dictionary ``d_out`` will be as follows: + + * d_out['etag'] == d_in['etag'] + + * d_out['path'] == d_in['path'] + + * d_in['size_bytes'] can be a string ("12") or an integer (12), but + d_out['size_bytes'] is an integer. + + * (optional) d_in['range'] is a string of the form "M-N", "M-", or + "-N", where M and N are non-negative integers. d_out['range'] is the + corresponding swob.Range object. If d_in does not have a key + 'range', neither will d_out. + + Inlined data dictionaries will have any extraneous padding stripped. + + :raises: HTTPException on parse errors or semantic errors (e.g. bogus + JSON structure, syntactically invalid ranges) + + :returns: a list of dictionaries on success + """ + try: + parsed_data = json.loads(req_body) + except ValueError: + raise HTTPBadRequest("Manifest must be valid JSON.\n") + + if not isinstance(parsed_data, list): + raise HTTPBadRequest("Manifest must be a list.\n") + + # If we got here, req_path refers to an object, so this won't ever raise + # ValueError. + vrs, account, _junk = split_path(req_path, 3, 3, True) + + errors = [] + for seg_index, seg_dict in enumerate(parsed_data): + if not isinstance(seg_dict, dict): + errors.append(b"Index %d: not a JSON object" % seg_index) + continue + + for required in SLO_KEYS: + if required in seg_dict: + segment_type = required + break + else: + errors.append( + b"Index %d: expected keys to include one of %s" + % (seg_index, + b" or ".join(repr(required) for required in SLO_KEYS))) + continue + + allowed_keys = SLO_KEYS[segment_type].union([segment_type]) + extraneous_keys = [k for k in seg_dict if k not in allowed_keys] + if extraneous_keys: + errors.append( + b"Index %d: extraneous keys %s" + % (seg_index, + b", ".join(json.dumps(ek).encode('ascii') + for ek in sorted(extraneous_keys)))) + continue + + if segment_type == 'path': + if not isinstance(seg_dict['path'], str): + errors.append(b"Index %d: \"path\" must be a string" % + seg_index) + continue + if not (seg_dict.get('etag') is None or + isinstance(seg_dict['etag'], str)): + errors.append(b'Index %d: "etag" must be a string or null ' + b'(if provided)' % seg_index) + continue + + if '/' not in seg_dict['path'].strip('/'): + errors.append( + b"Index %d: path does not refer to an object. Path must " + b"be of the form /container/object." % seg_index) + continue + + seg_size = seg_dict.get('size_bytes') + if seg_size is not None: + try: + seg_size = int(seg_size) + seg_dict['size_bytes'] = seg_size + except (TypeError, ValueError): + errors.append(b"Index %d: invalid size_bytes" % seg_index) + continue + if seg_size < 1 and seg_index != (len(parsed_data) - 1): + errors.append(b"Index %d: too small; each segment must be " + b"at least 1 byte." 
+ % (seg_index,)) + continue + + obj_path = '/'.join(['', vrs, account, + quote(seg_dict['path'].lstrip('/'))]) + if req_path == obj_path: + errors.append( + b"Index %d: manifest must not include itself as a segment" + % seg_index) + continue + + if seg_dict.get('range'): + try: + seg_dict['range'] = Range('bytes=%s' % seg_dict['range']) + except ValueError: + errors.append(b"Index %d: invalid range" % seg_index) + continue + + if len(seg_dict['range'].ranges) > 1: + errors.append(b"Index %d: multiple ranges " + b"(only one allowed)" % seg_index) + continue + + # If the user *told* us the object's size, we can check range + # satisfiability right now. If they lied about the size, we'll + # fail that validation later. + if (seg_size is not None and 1 != len( + seg_dict['range'].ranges_for_length(seg_size))): + errors.append(b"Index %d: unsatisfiable range" % seg_index) + continue + + elif segment_type == 'data': + # Validate that the supplied data is non-empty and base64-encoded + try: + data = strict_b64decode(seg_dict['data']) + except ValueError: + errors.append( + b"Index %d: data must be valid base64" % seg_index) + continue + if len(data) < 1: + errors.append(b"Index %d: too small; each segment must be " + b"at least 1 byte." + % (seg_index,)) + continue + # re-encode to normalize padding + seg_dict['data'] = base64.b64encode(data).decode('ascii') + + if parsed_data and all('data' in d for d in parsed_data): + errors.append(b"Inline data segments require at least one " + b"object-backed segment.") + + if errors: + error_message = b"".join(e + b"\n" for e in errors) + raise HTTPBadRequest(error_message, + headers={"Content-Type": "text/plain"}) + + return parsed_data + + +def _annotate_segments(segments, logger=None): + """ + Decode any inlined data and update sub_slo segments bytes from content-type + when available; then annotate segment dicts in segments list with + 'segment_length'. + + N.B. raw_data segments don't have a bytes key and range-segments need to + calculate their length from their range key but afterwards all segments + dicts will have 'segment_length' representing the length of the segment. + """ + for seg_dict in segments: + if 'data' in seg_dict: + seg_dict['raw_data'] = base64.b64decode(seg_dict.pop('data')) + segment_length = len(seg_dict['raw_data']) + else: + if config_true_value(seg_dict.get('sub_slo')): + override_bytes_from_content_type( + seg_dict, logger=logger) + seg_range = seg_dict.get('range') + if seg_range is not None: + # The range is of the form N-M, where N and M are both + # positive decimal integers. We know this because this + # middleware is the only thing that creates the SLO + # manifests stored in the cluster. + range_start, range_end = [ + int(x) for x in seg_range.split('-')] + segment_length = (range_end - range_start) + 1 + else: + segment_length = int(seg_dict['bytes']) + seg_dict['segment_length'] = segment_length + + +def calculate_byterange_for_part_num(req, segments, part_num): + """ + Helper function to calculate the byterange for a part_num response. + + N.B. as a side-effect of calculating the single tuple representing the + byterange required for a part_num response this function will also mutate + the request's Range header so that swob knows to return 206. 
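+
+    For example, with three 10-byte segments, ``part_num=2`` sets
+    ``Range: bytes=10-19`` on the request and returns ``(10, 19)``.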
+ + :param req: the request object + :param segments: the list of seg_dicts + :param part_num: the part number of the object to return + + :returns: a tuple representing the byterange + """ + start = 0 + for seg in segments[:part_num - 1]: + start += seg['segment_length'] + last = start + segments[part_num - 1]['segment_length'] + # We need to mutate the request's Range header so that swob knows to + # handle these partial content requests correctly. + req.range = "bytes=%d-%d" % (start, last - 1) + return start, last - 1 + + +def calculate_byteranges(req, segments, resp_attrs, part_num): + """ + Calculate the byteranges based on the request, segments, and part number. + + N.B. as a side-effect of calculating the single tuple representing the + byterange required for a part_num response this function will also mutate + the request's Range header so that swob knows to return 206. + + :param req: the request object + :param segments: the list of seg_dicts + :param resp_attrs: the slo response attributes + :param part_num: the part number of the object to return + + :returns: a list of tuples representing byteranges + """ + if req.range: + byteranges = [ + # For some reason, swob.Range.ranges_for_length adds 1 to the + # last byte's position. + (start, end - 1) for start, end + in req.range.ranges_for_length(resp_attrs.slo_size)] + elif part_num: + byteranges = [ + calculate_byterange_for_part_num(req, segments, part_num)] + else: + byteranges = [(0, resp_attrs.slo_size - 1)] + + return byteranges + + +class RespAttrs(object): + """ + Encapsulate properties of a GET or HEAD response that are pertinent to + handling a potential SLO response. + + Instances of this class are typically constructed using the + ``from_headers`` method. + + :param is_slo: True if the response appears to be an SLO manifest, False + otherwise. + :param timestamp: a value from which an instance of + :class:`~swift.common.utils.Timestamp` can be constructed. + :param manifest_etag: the Etag of the manifest object, or None if + ``is_slo`` is False. + :param slo_etag: the Etag of the SLO. + :param slo_size: the size of the SLO. + """ + def __init__(self, is_slo, timestamp, manifest_etag, slo_etag, slo_size): + self.is_slo = bool(is_slo) + self.timestamp = Timestamp(timestamp or Timestamp.zero()) + # manifest_etag is unambiguous, but json_md5 is even more explicit + self.json_md5 = manifest_etag or '' + self.slo_etag = slo_etag or '' + try: + # even though it's from sysmeta, we have to worry about empty + # values - see test_get_invalid_sysmeta_passthrough + self.slo_size = int(slo_size) + except (ValueError, TypeError): + self.slo_size = -1 + self.is_legacy = not self._has_size_and_etag() + + def _has_size_and_etag(self): + return self.slo_size >= 0 and self.slo_etag + + @classmethod + def from_headers(cls, response_headers): + """ + Inspect response headers and extract any resp_attrs we can find. 
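+
+        Only ``X-Static-Large-Object``, ``X-Backend-Timestamp``, ``Etag`` and
+        the SLO etag/size sysmeta headers are inspected; all other response
+        headers are ignored.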
+ + :param response_headers: list of tuples from a object response + :returns: an instance of RespAttrs to represent the response headers + """ + is_slo = False + timestamp = None + found_etag = None + slo_etag = None + slo_size = None + for header, value in response_headers: + header = header.lower() + if header == 'x-static-large-object': + is_slo = config_true_value(value) + elif header == 'x-backend-timestamp': + timestamp = value + elif header == 'etag': + found_etag = value + elif header == SYSMETA_SLO_ETAG: + slo_etag = value + elif header == SYSMETA_SLO_SIZE: + slo_size = value + manifest_etag = found_etag if is_slo else None + return cls(is_slo, timestamp, manifest_etag, slo_etag, slo_size) + + def update_from_segments(self, segments): + """ + Always called if SLO has fetched the manifest response body, for + legacy manifests we'll calculate size/etag values we wouldn't have + gotten from sys-meta headers. + """ + # we only have to set size/etag once; it doesn't matter if we got the + # values from sysmeta headers or segments + if self._has_size_and_etag(): + return + + calculated_size = 0 + calculated_etag = md5(usedforsecurity=False) + + for seg_dict in segments: + calculated_size += seg_dict['segment_length'] + + if 'raw_data' in seg_dict: + r = md5(seg_dict['raw_data'], + usedforsecurity=False).hexdigest() + elif seg_dict.get('range'): + r = '%s:%s;' % (seg_dict['hash'], seg_dict['range']) + else: + r = seg_dict['hash'] + calculated_etag.update(r.encode('ascii')) + + self.slo_size = calculated_size + self.slo_etag = calculated_etag.hexdigest() + + +class SloGetContext(WSGIContext): + + max_slo_recursion_depth = 10 + + def __init__(self, slo): + self.slo = slo + super(SloGetContext, self).__init__(slo.app) + # we'll know more after we look at the response metadata + self.segment_listing_needed = False + + def _fetch_sub_slo_segments(self, req, version, acc, con, obj): + """ + Fetch the submanifest, parse it, and return it. + Raise exception on failures. + + :param req: the upstream request + :param version: whatever + :param acc: native + :param con: native + :param obj: native + """ + sub_req = make_subrequest( + req.environ, + path=wsgi_quote('/'.join([ + '', str_to_wsgi(version), + str_to_wsgi(acc), str_to_wsgi(con), str_to_wsgi(obj)])), + method='GET', + headers={'x-auth-token': req.headers.get('x-auth-token')}, + agent='%(orig)s SLO MultipartGET', swift_source='SLO') + params_copy = dict(req.params) + params_copy.pop('part-number', None) + sub_req.params = params_copy + sub_resp = sub_req.get_response(self.slo.app) + + if not sub_resp.is_success: + # Error message should be short + body = sub_resp.body.decode('utf-8') + msg = ('while fetching %s, GET of submanifest %s ' + 'failed with status %d (%s)') + raise ListingIterError(msg % ( + req.path, sub_req.path, sub_resp.status_int, + body if len(body) <= 60 else body[:57] + '...')) + + try: + return self._parse_segments(sub_resp.app_iter) + except HTTPException as err: + raise ListingIterError( + 'while fetching %s, JSON-decoding of submanifest %s ' + 'failed with %s' % (req.path, sub_req.path, err)) + + def _segment_path(self, version, account, seg_dict): + return "/{ver}/{acc}/{conobj}".format( + ver=version, acc=account, + conobj=seg_dict['name'].lstrip('/') + ) + + def _segment_listing_iterator(self, req, version, account, segments, + byteranges): + # We handle the range stuff here so that we can be smart about + # skipping unused submanifests. 
For example, if our first segment is a + # submanifest referencing 50 MiB total, but start_byte falls in + # the 51st MiB, then we can avoid fetching the first submanifest. + # + # If we were to make SegmentedIterable handle all the range + # calculations, we would be unable to make this optimization. + + # Cache segments from sub-SLOs in case more than one byterange + # includes data from a particular sub-SLO. We only cache a few sets + # of segments so that a malicious user cannot build a giant SLO tree + # and then GET it to run the proxy out of memory. + # + # LRUCache is a little awkward to use this way, but it beats doing + # things manually. + # + # 20 is sort of an arbitrary choice; it's twice our max recursion + # depth, so we know this won't expand memory requirements by too + # much. + cached_fetch_sub_slo_segments = \ + LRUCache(maxsize=20)(self._fetch_sub_slo_segments) + + for first_byte, last_byte in byteranges: + byterange_listing_iter = self._byterange_listing_iterator( + req, version, account, segments, first_byte, last_byte, + cached_fetch_sub_slo_segments) + for seg_info in byterange_listing_iter: + yield seg_info + + def _byterange_listing_iterator(self, req, version, account, segments, + first_byte, last_byte, + cached_fetch_sub_slo_segments, + recursion_depth=1): + """ + Iterable that generates a filtered and annotated stream of segment + dicts describing the sub-segment ranges that would be used by the + SegmentedIterable to construct the bytes for a ranged response. + + :param req: original request object + :param version: version + :param account: account + :param segments: segments dictionary + :param first_byte: offset into the large object for the first byte + that is returned to the client + :param last_byte: offset into the large object for the last byte + that is returned to the client + :param cached_fetch_sub_slo_segments: LRU cache used for fetching + sub-segments + :param recursion_depth: max number of recursive sub_slo calls + """ + last_sub_path = None + for seg_dict in segments: + seg_length = seg_dict['segment_length'] + if first_byte >= seg_length: + # don't need any bytes from this segment + first_byte -= seg_length + last_byte -= seg_length + continue + + if last_byte < 0: + # no bytes are needed from this or any future segment + return + + if 'raw_data' in seg_dict: + yield dict(seg_dict, + first_byte=max(0, first_byte), + last_byte=min(seg_length - 1, last_byte)) + first_byte -= seg_length + last_byte -= seg_length + continue + + seg_range = seg_dict.get('range') + if seg_range is None: + range_start, range_end = 0, seg_length - 1 + else: + # This simple parsing of the range is valid because we already + # validated and supplied concrete values for the range + # during SLO manifest creation + range_start, range_end = map(int, seg_range.split('-')) + + if config_true_value(seg_dict.get('sub_slo')): + # Do this check here so that we can avoid fetching this last + # manifest before raising the exception + if recursion_depth >= self.max_slo_recursion_depth: + raise ListingIterError( + "While processing manifest %r, " + "max recursion depth was exceeded" % req.path) + + sub_path = seg_dict['name'] + sub_cont, sub_obj = split_path(sub_path, 2, 2, True) + if last_sub_path != sub_path: + sub_segments = cached_fetch_sub_slo_segments( + req, version, account, sub_cont, sub_obj) + last_sub_path = sub_path + + # Use the existing machinery to slice into the sub-SLO. 
+ for sub_seg_dict in self._byterange_listing_iterator( + req, version, account, sub_segments, + # This adjusts first_byte and last_byte to be + # relative to the sub-SLO. + range_start + max(0, first_byte), + min(range_end, range_start + last_byte), + + cached_fetch_sub_slo_segments, + recursion_depth=recursion_depth + 1): + yield sub_seg_dict + else: + yield dict(seg_dict, + first_byte=max(0, first_byte) + range_start, + last_byte=min(range_end, range_start + last_byte)) + + first_byte -= seg_length + last_byte -= seg_length + + def _is_body_complete(self): + content_range = '' + for header, value in self._response_headers: + if header.lower() == 'content-range': + content_range = value + break + # e.g. Content-Range: bytes 0-14289/14290 + match = re.match(r'bytes (\d+)-(\d+)/(\d+)$', content_range) + if not match: + # Malformed or missing, so we don't know what we got. + return False + first_byte, last_byte, length = [int(x) for x in match.groups()] + # If and only if we actually got back the full manifest body, then + # we can avoid re-fetching the object. + return first_byte == 0 and last_byte == length - 1 + + def _need_to_refetch_manifest(self, req, resp_attrs, is_part_num_request): + """ + Check if the segments will be needed to service the request and update + the segment_listing_needed attribute. + + :return: boolean indicating if we need to refetch, only if the segments + ARE needed we MAY need to refetch them! + """ + if req.method == 'HEAD': + # There may be some cases in the future where a HEAD resp on even a + # modern manifest should refetch, e.g. lp bug #2029174 + self.segment_listing_needed = (resp_attrs.is_legacy or + is_part_num_request) + # it will always be the case that a HEAD must re-fetch iff + # segment_listing_needed + return self.segment_listing_needed + + last_resp_status_int = self._get_status_int() + # These are based on etag (or last-modified), but the SLO's etag is + # almost certainly not the manifest object's etag. Still, it's highly + # likely that the submitted If-None-Match won't match the manifest + # object's etag, so we can avoid re-fetching the manifest if we got a + # successful response. + if last_resp_status_int in (412, 304): + # a conditional response from a modern manifest would have an + # accurate SLO etag, AND comparison with the etag-is-at header, but + # for legacy manifests responses (who always need to calculate the + # correct etag, even for if-[un]modified-since errors) we can't say + # what the etag is or if it matches unless we calculate it from + # segments - so we always need them + self.segment_listing_needed = resp_attrs.is_legacy + # if we need them; we can't get them from the error + return self.segment_listing_needed + + # This is GET request for an SLO object, if we're going to return a + # successful response we're going to need the segments, but this + # resp_iter may not contain the entire SLO manifest. + self.segment_listing_needed = True + + # modern swift object-servers should ignore Range headers on manifests, + # but during upgrade if we get a range response we'll probably have to + # refetch + if last_resp_status_int == 416: + # if the range wasn't satisfiable we need to refetch + return True + elif last_resp_status_int == 206: + # a partial response might included the whole content-range?! 
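+            # _is_body_complete() compares the Content-Range header against
+            # the total length; only a 206 that actually covered bytes
+            # 0..length-1 lets us reuse this body without a refetch.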
+ return not self._is_body_complete() + else: + # a good number of error responses would have returned earlier for + # lacking is_slo sys-meta, at this point we've filtered all the + # other response codes, so this is a prefectly normal 200 response, + # no need to refetch + return False + + def _refetch_manifest(self, req, resp_iter, orig_resp_attrs): + req.environ['swift.non_client_disconnect'] = True + friendly_close(resp_iter) + del req.environ['swift.non_client_disconnect'] + + headers_subset = ['x-auth-token', 'x-open-expired'] + get_req = make_subrequest( + req.environ, method='GET', + headers={k: req.headers.get(k) + for k in headers_subset if k in req.headers}, + agent='%(orig)s SLO MultipartGET', swift_source='SLO') + resp_iter = self._app_call(get_req.environ) + new_resp_attrs = RespAttrs.from_headers(self._response_headers) + if new_resp_attrs.timestamp < orig_resp_attrs.timestamp and \ + not new_resp_attrs.is_slo: + # Our *orig_resp_attrs* saw *newer* data that indicated it was an + # SLO, but on refetch it's an older object or error; 503 seems + # reasonable? + friendly_close(resp_iter) + raise HTTPServiceUnavailable(request=req) + # else, the caller will know how to return this response + return new_resp_attrs, resp_iter + + def _parse_segments(self, resp_iter): + """ + Read the manifest body and parse segments. + + :returns: segments + :raises: HTTPServerError + """ + segments = self._get_manifest_read(resp_iter) + _annotate_segments(segments, logger=self.slo.logger) + return segments + + def _return_manifest_response(self, req, start_response, resp_iter, + is_format_raw): + if is_format_raw: + json_data = self.convert_segment_listing(resp_iter) + # we've created a new response body + resp_iter = [json_data] + replace_headers = { + # Note that we have to return the large object's content-type + # (not application/json) so it's like what the client sent on + # PUT. Otherwise, server-side copy won't work. 
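+                # Only Content-Length and Etag are replaced to match the
+                # converted body; the stored Content-Type passes through
+                # from the manifest response untouched.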
+ 'Content-Length': len(json_data), + 'Etag': md5(json_data, usedforsecurity=False).hexdigest(), + } + else: + # we're going to return the manifest resp_iter as-is + replace_headers = { + 'Content-Type': 'application/json; charset=utf-8', + } + return self._return_response(req, start_response, resp_iter, + replace_headers) + + def _return_slo_response(self, req, start_response, resp_iter, resp_attrs): + headers = { + 'Etag': '"%s"' % resp_attrs.slo_etag, + 'X-Manifest-Etag': resp_attrs.json_md5, + # swob will fix this for a GET with Range + 'Content-Length': str(resp_attrs.slo_size), + # ignore bogus content-range, make swob figure it out + 'Content-Range': None, + } + if self.segment_listing_needed: + # consume existing resp_iter; we'll create a new one + segments = self._parse_segments(resp_iter) + resp_attrs.update_from_segments(segments) + headers['Etag'] = '"%s"' % resp_attrs.slo_etag + headers['Content-Length'] = str(resp_attrs.slo_size) + part_num = get_valid_part_num(req) + if part_num: + headers['X-Parts-Count'] = len(segments) + + if part_num and part_num > len(segments): + if req.method == 'HEAD': + resp_iter = [] + headers['Content-Length'] = '0' + else: + body = b'The requested part number is not satisfiable' + resp_iter = [body] + headers['Content-Length'] = len(body) + headers['Content-Range'] = 'bytes */%d' % resp_attrs.slo_size + self._response_status = '416 Requested Range Not Satisfiable' + elif part_num and req.method == 'HEAD': + resp_iter = [] + headers['Content-Length'] = \ + segments[part_num - 1].get('segment_length') + start, end = calculate_byterange_for_part_num( + req, segments, part_num) + headers['Content-Range'] = \ + 'bytes {}-{}/{}'.format(start, end, + resp_attrs.slo_size) + # The RFC specifies 206 in the context of Range requests, and + # Range headers MUST be ignored for HEADs [1], so a HEAD will + # not normally return a 206. However, a part-number HEAD + # returns Content-Length equal to the part size, rather than + # the whole object size, so in this case we do return 206. + # [1] https://www.rfc-editor.org/rfc/rfc9110#name-range + self._response_status = '206 Partial Content' + elif req.method == 'HEAD': + resp_iter = [] + else: + byteranges = calculate_byteranges( + req, segments, resp_attrs, part_num) + resp_iter = self._build_resp_iter(req, segments, byteranges) + return self._return_response(req, start_response, resp_iter, + replace_headers=headers) + + def _return_response(self, req, start_response, resp_iter, + replace_headers): + if req.method == 'HEAD' or self._get_status_int() in (412, 304): + # we should drain HEAD and unmet condition responses since they + # don't have bodies + friendly_close(resp_iter) + resp_iter = b'' + resp_headers = HeaderKeyDict(self._response_headers, **replace_headers) + resp = Response( + status=self._response_status, + headers=resp_headers, + app_iter=resp_iter, + request=req, + conditional_response=True, + conditional_etag=resolve_etag_is_at_header(req, resp_headers)) + return resp(req.environ, start_response) + + def _return_non_slo_response(self, req, start_response, resp_iter): + # our "pass-through" response may have been from a manifest refetch w/o + # range/conditional headers that turned out to be a real object, and + # now we want out. 
But if the original client request included Range + # or Conditional headers we can trust swob to do the right conversion + # back into a 206/416/304/412 (as long as the response we have is a + # normal successful response and we respect any forwarding middleware's + # etag-is-at header that we stripped off for the refetch!) + resp = Response( + status=self._response_status, + headers=self._response_headers, + app_iter=resp_iter, + request=req, + conditional_response=self._get_status_int() == 200, + conditional_etag=resolve_etag_is_at_header( + req, self._response_headers) + ) + return resp(req.environ, start_response) + + def handle_slo_get_or_head(self, req, start_response): + """ + Takes a request and a start_response callable and does the normal WSGI + thing with them. Returns an iterator suitable for sending up the WSGI + chain. + + :param req: :class:`~swift.common.swob.Request` object; is a ``GET`` or + ``HEAD`` request aimed at what may (or may not) be a static + large object manifest. + :param start_response: WSGI start_response callable + """ + is_manifest_get = get_param(req, 'multipart-manifest') == 'get' + is_format_raw = is_manifest_get and get_param(req, 'format') == 'raw' + + if not is_manifest_get: + # If this object is an SLO manifest, we may have saved off the + # large object etag during the original PUT. Send an + # X-Backend-Etag-Is-At header so that, if the SLO etag *was* saved, + # we can trust the object-server to respond appropriately to + # If-Match/If-None-Match requests. + update_etag_is_at_header(req, SYSMETA_SLO_ETAG) + # Tell the object server that if it's a manifest, + # we want the whole thing + update_ignore_range_header(req, 'X-Static-Large-Object') + + # process original request + orig_path_info = req.path_info + resp_iter = self._app_call(req.environ) + resp_attrs = RespAttrs.from_headers(self._response_headers) + if resp_attrs.is_slo and not is_manifest_get: + try: + # only validate part-number if the request is to an SLO + part_num = get_valid_part_num(req) + except HTTPException: + friendly_close(resp_iter) + raise + # the next two calls hide a couple side effects, sorry: + # + # 1) regardless of the return value the "need_to_refetch" check + # *may* also set self.segment_listing_needed = True (it's + # commented to help you wrap your head around that one, + # good luck) + # 2) if we refetch, we overwrite the current resp_iter and + # resp_attrs variables, partly because we *might* get back a NOT + # resp_attrs.is_slo response (even if we had one to start), but + # hopefully they're just the manifest resp we needed to refetch! + if self._need_to_refetch_manifest(req, resp_attrs, part_num): + # reset path in case it was modified during original request + # (e.g. 
object versioning might re-write the path) + req.path_info = orig_path_info + resp_attrs, resp_iter = self._refetch_manifest( + req, resp_iter, resp_attrs) + + if not resp_attrs.is_slo: + # even if the original resp_attrs may have been SLO we may have + # refetched, this also handles the server error case + return self._return_non_slo_response( + req, start_response, resp_iter) + + if is_manifest_get: + # manifest pass through doesn't require resp_attrs + return self._return_manifest_response(req, start_response, + resp_iter, is_format_raw) + + # this a GET/HEAD response for the SLO object (not the manifest) + return self._return_slo_response(req, start_response, resp_iter, + resp_attrs) + + def convert_segment_listing(self, resp_iter): + """ + Converts the manifest data to match with the format + that was put in through ?multipart-manifest=put + + :param resp_iter: a response iterable + + :raises HTTPServerError: + :returns: the json-serialized raw format (as bytes) + """ + segments = self._get_manifest_read(resp_iter) + + for seg_dict in segments: + if 'data' in seg_dict: + continue + seg_dict.pop('content_type', None) + seg_dict.pop('last_modified', None) + seg_dict.pop('sub_slo', None) + seg_dict['path'] = seg_dict.pop('name', None) + seg_dict['size_bytes'] = seg_dict.pop('bytes', None) + seg_dict['etag'] = seg_dict.pop('hash', None) + + json_data = json.dumps(segments, sort_keys=True) # convert to string + return json_data.encode('utf-8') + + def _get_manifest_read(self, resp_iter): + with closing_if_possible(resp_iter): + resp_body = b''.join(resp_iter) + try: + segments = json.loads(resp_body) + except ValueError as e: + msg = 'Unable to load SLO manifest' + self.slo.logger.error('%s: %s', msg, e) + raise HTTPServerError(msg) + return segments + + def _build_resp_iter(self, req, segments, byteranges): + """ + Build a response iterable for a GET request. + + :param req: the request object + :param segments: the list of seg_dicts + :param byteranges: a list of tuples representing byteranges + + :returns: a segmented iterable + """ + ver, account, _junk = req.split_path(3, 3, rest_with_last=True) + account = wsgi_to_str(account) + plain_listing_iter = self._segment_listing_iterator( + req, ver, account, segments, byteranges) + + def ratelimit_predicate(seg_dict): + if 'raw_data' in seg_dict: + return False # it's already in memory anyway + start = seg_dict.get('start_byte') or 0 + end = seg_dict.get('end_byte') + if end is None: + end = int(seg_dict['bytes']) - 1 + is_small = (end - start + 1) < self.slo.rate_limit_under_size + return is_small + + ratelimited_listing_iter = RateLimitedIterator( + plain_listing_iter, + self.slo.rate_limit_segments_per_sec, + limit_after=self.slo.rate_limit_after_segment, + ratelimit_if=ratelimit_predicate) + + # data segments are already in the correct format, but object-backed + # segments need a path key added + segment_listing_iter = ( + seg_dict if 'raw_data' in seg_dict else + dict(seg_dict, path=self._segment_path(ver, account, seg_dict)) + for seg_dict in ratelimited_listing_iter) + + segmented_iter = SegmentedIterable( + req, self.slo.app, segment_listing_iter, + name=req.path, logger=self.slo.logger, + ua_suffix="SLO MultipartGET", + swift_source="SLO", + max_get_time=self.slo.max_get_time) + + try: + segmented_iter.validate_first_segment() + except (ListingIterError, SegmentError): + # Copy from the SLO explanation in top of this file. 
+ # If any of the segments from the manifest are not found or + # their Etag/Content Length no longer match the connection + # will drop. In this case a 409 Conflict will be logged in + # the proxy logs and the user will receive incomplete results. + raise HTTPConflict(request=req) + return segmented_iter + + +class StaticLargeObject(object): + """ + StaticLargeObject Middleware + + See above for a full description. + + The proxy logs created for any subrequests made will have swift.source set + to "SLO". + + :param app: The next WSGI filter or app in the paste.deploy chain. + :param conf: The configuration dict for the middleware. + :param max_manifest_segments: The maximum number of segments allowed in + newly-created static large objects. + :param max_manifest_size: The maximum size (in bytes) of newly-created + static-large-object manifests. + :param yield_frequency: If the client included ``heartbeat=on`` in the + query parameters when creating a new static large + object, the period of time to wait between sending + whitespace to keep the connection alive. + """ + + def __init__(self, app, conf, + max_manifest_segments=DEFAULT_MAX_MANIFEST_SEGMENTS, + max_manifest_size=DEFAULT_MAX_MANIFEST_SIZE, + yield_frequency=DEFAULT_YIELD_FREQUENCY, + allow_async_delete=True): + self.conf = conf + self.app = app + self.logger = get_logger(conf, log_route='slo') + self.max_manifest_segments = max_manifest_segments + self.max_manifest_size = max_manifest_size + self.yield_frequency = yield_frequency + self.allow_async_delete = allow_async_delete + self.max_get_time = int(self.conf.get('max_get_time', 86400)) + self.rate_limit_under_size = int(self.conf.get( + 'rate_limit_under_size', DEFAULT_RATE_LIMIT_UNDER_SIZE)) + self.rate_limit_after_segment = int(self.conf.get( + 'rate_limit_after_segment', '10')) + self.rate_limit_segments_per_sec = int(self.conf.get( + 'rate_limit_segments_per_sec', '1')) + self.concurrency = min(1000, max(0, int(self.conf.get( + 'concurrency', '2')))) + delete_concurrency = int(self.conf.get( + 'delete_concurrency', self.concurrency)) + self.bulk_deleter = Bulk( + app, {}, + max_deletes_per_request=float('inf'), + delete_concurrency=delete_concurrency, + logger=self.logger) + + self.expirer_config = expirer.ExpirerConfig(conf, logger=self.logger) + + def handle_multipart_get_or_head(self, req, start_response): + """ + Handles the GET or HEAD of a SLO manifest. + + The response body (only on GET, of course) will consist of the + concatenation of the segments. + + :param req: a :class:`~swift.common.swob.Request` with a path + referencing an object + :param start_response: WSGI start_response callable + :raises HttpException: on errors + """ + return SloGetContext(self).handle_slo_get_or_head(req, start_response) + + def handle_multipart_put(self, req, start_response): + """ + Will handle the PUT of a SLO manifest. + Heads every object in manifest to check if is valid and if so will + save a manifest generated from the user input. Uses WSGIContext to + call self and start_response and returns a WSGI iterator. 
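+        When the client passes ``heartbeat=on``, a ``202 Accepted`` response
+        is started right away and whitespace is streamed while the segments
+        are HEADed, followed by a final body describing the result.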
+ + :param req: a :class:`~swift.common.swob.Request` with an obj in path + :param start_response: WSGI start_response callable + :raises HttpException: on errors + """ + vrs, account, container, obj = req.split_path(4, rest_with_last=True) + if req.headers.get('X-Copy-From'): + raise HTTPMethodNotAllowed( + 'Multipart Manifest PUTs cannot be COPY requests') + if req.content_length is None: + if req.headers.get('transfer-encoding', '').lower() != 'chunked': + raise HTTPLengthRequired(request=req) + else: + if req.content_length > self.max_manifest_size: + raise HTTPRequestEntityTooLarge( + "Manifest File > %d bytes" % self.max_manifest_size) + parsed_data = parse_and_validate_input( + req.body_file.read(self.max_manifest_size), + wsgi_to_str(req.path)) + problem_segments = [] + + object_segments = [seg for seg in parsed_data if 'path' in seg] + if len(object_segments) > self.max_manifest_segments: + raise HTTPRequestEntityTooLarge( + 'Number of object-backed segments must be <= %d' % + self.max_manifest_segments) + try: + out_content_type = req.accept.best_match(ACCEPTABLE_FORMATS) + except ValueError: + out_content_type = 'text/plain' # Ignore invalid header + if not out_content_type: + out_content_type = 'text/plain' + data_for_storage = [None] * len(parsed_data) + total_size = 0 + path2indices = defaultdict(list) + for index, seg_dict in enumerate(parsed_data): + if 'data' in seg_dict: + data_for_storage[index] = seg_dict + total_size += len(base64.b64decode(seg_dict['data'])) + else: + path2indices[seg_dict['path']].append(index) + + def do_head(obj_name): + obj_path = '/'.join(['', vrs, account, + str_to_wsgi(obj_name.lstrip('/'))]) + obj_path = wsgi_quote(obj_path) + + sub_req = make_subrequest( + req.environ, path=obj_path + '?', # kill the query string + method='HEAD', + headers={'x-auth-token': req.headers.get('x-auth-token')}, + agent='%(orig)s SLO MultipartPUT', swift_source='SLO') + return obj_name, sub_req.get_response(self) + + def validate_seg_dict(seg_dict, head_seg_resp, allow_empty_segment): + obj_name = seg_dict['path'] + if not head_seg_resp.is_success: + problem_segments.append([quote(obj_name), + head_seg_resp.status]) + return 0, None + + segment_length = head_seg_resp.content_length + if seg_dict.get('range'): + # Since we now know the length, we can normalize the + # range. We know that there is exactly one range + # requested since we checked that earlier in + # parse_and_validate_input(). + ranges = seg_dict['range'].ranges_for_length( + head_seg_resp.content_length) + + if not ranges: + problem_segments.append([quote(obj_name), + 'Unsatisfiable Range']) + elif ranges == [(0, head_seg_resp.content_length)]: + # Just one range, and it exactly matches the object. + # Why'd we do this again? 
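+                    # (Dropping the range here means the stored entry, and
+                    # the SLO Etag computed below, match a segment uploaded
+                    # without any range at all.)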
+ del seg_dict['range'] + segment_length = head_seg_resp.content_length + else: + rng = ranges[0] + seg_dict['range'] = '%d-%d' % (rng[0], rng[1] - 1) + segment_length = rng[1] - rng[0] + + if segment_length < 1 and not allow_empty_segment: + problem_segments.append( + [quote(obj_name), + 'Too small; each segment must be at least 1 byte.']) + + _size_bytes = seg_dict.get('size_bytes') + size_mismatch = ( + _size_bytes is not None and + _size_bytes != head_seg_resp.content_length + ) + if size_mismatch: + problem_segments.append([quote(obj_name), 'Size Mismatch']) + + _etag = seg_dict.get('etag') + etag_mismatch = ( + _etag is not None and + _etag != head_seg_resp.etag + ) + if etag_mismatch: + problem_segments.append([quote(obj_name), 'Etag Mismatch']) + + if head_seg_resp.last_modified: + last_modified = head_seg_resp.last_modified + else: + # shouldn't happen + last_modified = datetime.now() + + last_modified_formatted = last_modified.strftime( + '%Y-%m-%dT%H:%M:%S.%f' + ) + seg_data = { + 'name': '/' + seg_dict['path'].lstrip('/'), + 'bytes': head_seg_resp.content_length, + 'hash': head_seg_resp.etag, + 'content_type': head_seg_resp.content_type, + 'last_modified': last_modified_formatted + } + if seg_dict.get('range'): + seg_data['range'] = seg_dict['range'] + if config_true_value( + head_seg_resp.headers.get('X-Static-Large-Object')): + seg_data['sub_slo'] = True + + return segment_length, seg_data + + heartbeat = config_true_value(req.params.get('heartbeat')) + separator = b'' + if heartbeat: + # Apparently some ways of deploying require that this to happens + # *before* the return? Not sure why. + req.environ['eventlet.minimum_write_chunk_size'] = 0 + start_response('202 Accepted', [ # NB: not 201 ! + ('Content-Type', out_content_type), + ]) + separator = b'\r\n\r\n' + + def resp_iter(total_size=total_size): + # wsgi won't propagate start_response calls until some data has + # been yielded so make sure first heartbeat is sent immediately + if heartbeat: + yield b' ' + last_yield_time = time.time() + with StreamingPile(self.concurrency) as pile: + for obj_name, resp in pile.asyncstarmap(do_head, ( + (path, ) for path in path2indices)): + now = time.time() + if heartbeat and (now - last_yield_time > + self.yield_frequency): + # Make sure we've called start_response before + # sending data + yield b' ' + last_yield_time = now + for i in path2indices[obj_name]: + segment_length, seg_data = validate_seg_dict( + parsed_data[i], resp, + allow_empty_segment=(i == len(parsed_data) - 1)) + data_for_storage[i] = seg_data + total_size += segment_length + + # Middleware left of SLO can add a callback to the WSGI + # environment to perform additional validation and/or + # manipulation on the manifest that will be written. 
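+            # The hook receives the list of segment dicts about to be
+            # stored; any problems it returns are reported to the client
+            # just like ordinary segment validation failures.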
+ hook = req.environ.get('swift.callback.slo_manifest_hook') + if hook: + more_problems = hook(data_for_storage) + if more_problems: + problem_segments.extend(more_problems) + + if problem_segments: + err = HTTPBadRequest(content_type=out_content_type) + resp_dict = {} + if heartbeat: + resp_dict['Response Status'] = err.status + err_body = err.body.decode('utf-8') + resp_dict['Response Body'] = err_body or '\n'.join( + RESPONSE_REASONS.get(err.status_int, [''])) + else: + start_response(err.status, + [(h, v) for h, v in err.headers.items() + if h.lower() != 'content-length']) + yield separator + get_heartbeat_response_body( + out_content_type, resp_dict, problem_segments, 'upload') + return + + slo_etag = md5(usedforsecurity=False) + for seg_data in data_for_storage: + if 'data' in seg_data: + raw_data = base64.b64decode(seg_data['data']) + r = md5(raw_data, usedforsecurity=False).hexdigest() + elif seg_data.get('range'): + r = '%s:%s;' % (seg_data['hash'], seg_data['range']) + else: + r = seg_data['hash'] + slo_etag.update(r.encode('ascii')) + + slo_etag = slo_etag.hexdigest() + client_etag = normalize_etag(req.headers.get('Etag')) + if client_etag and client_etag != slo_etag: + err = HTTPUnprocessableEntity(request=req) + if heartbeat: + resp_dict = {} + resp_dict['Response Status'] = err.status + err_body = err.body + if isinstance(err_body, bytes): + err_body = err_body.decode('utf-8', errors='replace') + resp_dict['Response Body'] = err_body or '\n'.join( + RESPONSE_REASONS.get(err.status_int, [''])) + yield separator + get_heartbeat_response_body( + out_content_type, resp_dict, problem_segments, + 'upload') + else: + for chunk in err(req.environ, start_response): + yield chunk + return + + json_data = json.dumps(data_for_storage).encode('utf-8') + req.body = json_data + req.headers.update({ + SYSMETA_SLO_ETAG: slo_etag, + SYSMETA_SLO_SIZE: total_size, + 'X-Static-Large-Object': 'True', + 'Etag': md5(json_data, usedforsecurity=False).hexdigest(), + }) + + # Ensure container listings have both etags. However, if any + # middleware to the left of us touched the base value, trust them. + override_header = get_container_update_override_key('etag') + val, sep, params = req.headers.get( + override_header, '').partition(';') + req.headers[override_header] = '%s; slo_etag=%s' % ( + (val or req.headers['Etag']) + sep + params, slo_etag) + + env = req.environ + if not env.get('CONTENT_TYPE'): + guessed_type, _junk = mimetypes.guess_type( + wsgi_to_str(req.path_info)) + env['CONTENT_TYPE'] = (guessed_type or + 'application/octet-stream') + env['swift.content_type_overridden'] = True + env['CONTENT_TYPE'] += ";swift_bytes=%d" % total_size + + resp = req.get_response(self.app) + resp_dict = {'Response Status': resp.status} + if resp.is_success: + resp.etag = slo_etag + resp_dict['Etag'] = resp.headers['Etag'] + resp_dict['Last Modified'] = resp.headers['Last-Modified'] + + if heartbeat: + resp_body = resp.body + if isinstance(resp_body, bytes): + resp_body = resp_body.decode('utf-8') + resp_dict['Response Body'] = resp_body + yield separator + get_heartbeat_response_body( + out_content_type, resp_dict, [], 'upload') + else: + for chunk in resp(req.environ, start_response): + yield chunk + + return resp_iter() + + def get_segments_to_delete_iter(self, req): + """ + A generator function to be used to delete all the segments and + sub-segments referenced in a manifest. 
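+        Sub-SLO manifests are expanded as they are encountered, and each
+        sub-manifest is queued again behind its own segments so that it is
+        yielded (and so deleted) only after them.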
+ + :param req: a :class:`~swift.common.swob.Request` with an SLO manifest + in path + :raises HTTPPreconditionFailed: on invalid UTF8 in request path + :raises HTTPBadRequest: on too many buffered sub segments and + on invalid SLO manifest path + """ + if not check_utf8(wsgi_to_str(req.path_info)): + raise HTTPPreconditionFailed( + request=req, body='Invalid UTF8 or contains NULL') + vrs, account, container, obj = req.split_path(4, 4, True) + obj_path = '/%s/%s' % (wsgi_to_str(container), wsgi_to_str(obj)) + + segments = [{ + 'sub_slo': True, + 'name': obj_path}] + if 'version-id' in req.params: + segments[0]['version_id'] = req.params['version-id'] + + while segments: + # We chose not to set the limit at max_manifest_segments + # in the case this value was decreased by operators. + # Still it is important to set a limit to avoid this list + # growing too large and causing OOM failures. + # x10 is a best guess as to how much operators would change + # the value of max_manifest_segments. + if len(segments) > self.max_manifest_segments * 10: + raise HTTPBadRequest( + 'Too many buffered slo segments to delete.') + seg_data = segments.pop(0) + if 'data' in seg_data: + continue + if seg_data.get('sub_slo'): + try: + segments.extend( + self.get_slo_segments(seg_data['name'], req)) + except HTTPException as err: + # allow bulk delete response to report errors + err_body = err.body + if isinstance(err_body, bytes): + err_body = err_body.decode('utf-8', errors='replace') + seg_data['error'] = {'code': err.status_int, + 'message': err_body} + + # add manifest back to be deleted after segments + seg_data['sub_slo'] = False + segments.append(seg_data) + else: + yield seg_data + + def get_slo_segments(self, obj_name, req): + """ + Performs a :class:`~swift.common.swob.Request` and returns the SLO + manifest's segments. + + :param obj_name: the name of the object being deleted, + as ``/container/object`` + :param req: the base :class:`~swift.common.swob.Request` + :raises HTTPServerError: on unable to load obj_name or + on unable to load the SLO manifest data. 
+ :raises HTTPBadRequest: on not an SLO manifest + :raises HTTPNotFound: on SLO manifest not found + :returns: SLO manifest's segments + """ + vrs, account, _junk = req.split_path(2, 3, True) + new_env = req.environ.copy() + new_env['REQUEST_METHOD'] = 'GET' + del new_env['wsgi.input'] + new_env['QUERY_STRING'] = 'multipart-manifest=get' + if 'version-id' in req.params: + new_env['QUERY_STRING'] += \ + '&version-id=' + req.params['version-id'] + new_env['CONTENT_LENGTH'] = 0 + new_env['HTTP_USER_AGENT'] = \ + '%s MultipartDELETE' % new_env.get('HTTP_USER_AGENT') + new_env['swift.source'] = 'SLO' + new_env['PATH_INFO'] = ( + '/%s/%s/%s' % (vrs, account, str_to_wsgi(obj_name.lstrip('/'))) + ) + # Just request the last byte of non-SLO objects so we don't waste + # a resources in friendly_close() below + manifest_req = Request.blank('', new_env, range='bytes=-1') + update_ignore_range_header(manifest_req, 'X-Static-Large-Object') + resp = manifest_req.get_response(self.app) + + if resp.is_success and config_true_value(resp.headers.get( + 'X-Static-Large-Object')) and len(resp.body) == 1: + # pre-2.24.0 object-server + manifest_req = Request.blank('', new_env) + resp = manifest_req.get_response(self.app) + + if resp.is_success: + if config_true_value(resp.headers.get('X-Static-Large-Object')): + try: + return json.loads(resp.body) + except ValueError: + raise HTTPServerError('Unable to load SLO manifest') + else: + # Drain and close GET request (prevents socket leaks) + friendly_close(resp) + raise HTTPBadRequest('Not an SLO manifest') + elif resp.status_int == HTTP_NOT_FOUND: + raise HTTPNotFound('SLO manifest not found') + elif resp.status_int == HTTP_UNAUTHORIZED: + raise HTTPUnauthorized('401 Unauthorized') + else: + raise HTTPServerError('Unable to load SLO manifest or segment.') + + def handle_async_delete(self, req): + if not check_utf8(wsgi_to_str(req.path_info)): + raise HTTPPreconditionFailed( + request=req, body='Invalid UTF8 or contains NULL') + vrs, account, container, obj = req.split_path(4, 4, True) + obj_path = '/%s/%s' % (wsgi_to_str(container), wsgi_to_str(obj)) + segments = [seg for seg in self.get_slo_segments(obj_path, req) + if 'data' not in seg] + if not segments: + # Degenerate case: just delete the manifest + return self.app + + segment_containers, segment_objects = zip(*( + split_path(seg['name'], 2, 2, True) for seg in segments)) + segment_containers = set(segment_containers) + if len(segment_containers) > 1: + container_csv = ', '.join( + '"%s"' % quote(c) for c in segment_containers) + raise HTTPBadRequest('All segments must be in one container. 
' + 'Found segments in %s' % container_csv) + if any(seg.get('sub_slo') for seg in segments): + raise HTTPBadRequest('No segments may be large objects.') + + # Auth checks + segment_container = segment_containers.pop() + if 'swift.authorize' in req.environ: + container_info = get_container_info( + req.environ, self.app, swift_source='SLO') + req.acl = container_info.get('write_acl') + aresp = req.environ['swift.authorize'](req) + req.acl = None + if aresp: + return aresp + + if bytes_to_wsgi(segment_container.encode('utf-8')) != container: + path = '/%s/%s/%s' % (vrs, account, bytes_to_wsgi( + segment_container.encode('utf-8'))) + seg_container_info = get_container_info( + make_env(req.environ, path=path, swift_source='SLO'), + self.app, swift_source='SLO') + req.acl = seg_container_info.get('write_acl') + aresp = req.environ['swift.authorize'](req) + req.acl = None + if aresp: + return aresp + + # Did our sanity checks; schedule segments to be deleted + ts = req.ensure_x_timestamp() + expirer_jobs = make_delete_jobs( + wsgi_to_str(account), segment_container, segment_objects, ts) + expiring_objects_account, expirer_cont = \ + self.expirer_config.get_expirer_account_and_container( + ts, wsgi_to_str(account), wsgi_to_str(container), + wsgi_to_str(obj)) + enqueue_req = make_pre_authed_request( + req.environ, + method='UPDATE', + path="/v1/%s/%s" % (expiring_objects_account, expirer_cont), + body=json.dumps(expirer_jobs), + headers={'Content-Type': 'application/json', + 'X-Backend-Storage-Policy-Index': '0', + 'X-Backend-Allow-Private-Methods': 'True'}, + ) + resp = enqueue_req.get_response(self.app) + if not resp.is_success: + self.logger.error( + 'Failed to enqueue expiration entries: %s\n%s', + resp.status, resp.body) + return HTTPServiceUnavailable() + # consume the response (should be short) + friendly_close(resp) + + # Finally, delete the manifest + return self.app + + def handle_multipart_delete(self, req): + """ + Will delete all the segments in the SLO manifest and then, if + successful, will delete the manifest file. 
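+        If async deletes are allowed and the request carries a true ``async``
+        query parameter, the segments are instead queued for the object
+        expirer and only the manifest is deleted inline.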
+ + :param req: a :class:`~swift.common.swob.Request` with an obj in path + :returns: swob.Response whose app_iter set to Bulk.handle_delete_iter + """ + if self.allow_async_delete and config_true_value( + req.params.get('async')): + return self.handle_async_delete(req) + + req.headers['Content-Type'] = None # Ignore content-type from client + resp = HTTPOk(request=req) + try: + out_content_type = req.accept.best_match(ACCEPTABLE_FORMATS) + except ValueError: + out_content_type = None # Ignore invalid header + if out_content_type: + resp.content_type = out_content_type + resp.app_iter = self.bulk_deleter.handle_delete_iter( + req, objs_to_delete=self.get_segments_to_delete_iter(req), + user_agent='MultipartDELETE', swift_source='SLO', + out_content_type=out_content_type) + return resp + + def handle_container_listing(self, req, start_response): + resp = req.get_response(self.app) + if not resp.is_success or resp.content_type != 'application/json': + return resp(req.environ, start_response) + if resp.content_length is None or \ + resp.content_length > MAX_CONTAINER_LISTING_CONTENT_LENGTH: + return resp(req.environ, start_response) + try: + listing = json.loads(resp.body) + except ValueError: + return resp(req.environ, start_response) + + for item in listing: + if 'subdir' in item: + continue + etag, params = parse_header(item['hash']) + if 'slo_etag' in params: + item['slo_etag'] = '"%s"' % params.pop('slo_etag') + item['hash'] = etag + ''.join( + '; %s=%s' % kv for kv in params.items()) + + resp.body = json.dumps(listing).encode('ascii') + return resp(req.environ, start_response) + + def __call__(self, env, start_response): + """ + WSGI entry point + """ + if env.get('swift.slo_override'): + return self.app(env, start_response) + + req = Request(env) + try: + vrs, account, container, obj = req.split_path(3, 4, True) + is_cont_or_obj_req = True + except ValueError: + is_cont_or_obj_req = False + if not is_cont_or_obj_req: + return self.app(env, start_response) + + if not obj: + if req.method == 'GET': + return self.handle_container_listing(req, start_response) + return self.app(env, start_response) + + try: + if req.method == 'PUT' and \ + req.params.get('multipart-manifest') == 'put': + return self.handle_multipart_put(req, start_response) + if req.method == 'DELETE' and \ + req.params.get('multipart-manifest') == 'delete': + return self.handle_multipart_delete(req)(env, start_response) + if req.method == 'GET' or req.method == 'HEAD': + return self.handle_multipart_get_or_head(req, start_response) + if 'X-Static-Large-Object' in req.headers: + raise HTTPBadRequest( + request=req, + body='X-Static-Large-Object is a reserved header. 
' + 'To create a static large object add query param ' + 'multipart-manifest=put.') + except HTTPException as err_resp: + return err_resp(env, start_response) + + return self.app(env, start_response) + + +def filter_factory(global_conf, **local_conf): + conf = global_conf.copy() + conf.update(local_conf) + + max_manifest_segments = int(conf.get('max_manifest_segments', + DEFAULT_MAX_MANIFEST_SEGMENTS)) + max_manifest_size = int(conf.get('max_manifest_size', + DEFAULT_MAX_MANIFEST_SIZE)) + yield_frequency = int(conf.get('yield_frequency', + DEFAULT_YIELD_FREQUENCY)) + allow_async_delete = config_true_value(conf.get('allow_async_delete', + 'true')) + + register_swift_info('slo', + max_manifest_segments=max_manifest_segments, + max_manifest_size=max_manifest_size, + yield_frequency=yield_frequency, + # this used to be configurable; report it as 1 for + # clients that might still care + min_segment_size=1, + allow_async_delete=allow_async_delete) + + def slo_filter(app): + return StaticLargeObject( + app, conf, + max_manifest_segments=max_manifest_segments, + max_manifest_size=max_manifest_size, + yield_frequency=yield_frequency, + allow_async_delete=allow_async_delete) + return slo_filter diff --git a/swift/common/middleware/staticweb.py b/swift/common/middleware/staticweb.py index 6aaeaa0ee9..d63032ae69 100644 --- a/swift/common/middleware/staticweb.py +++ b/swift/common/middleware/staticweb.py @@ -1,4 +1,4 @@ -# Copyright (c) 2010-2012 OpenStack, LLC. +# Copyright (c) 2010-2016 OpenStack Foundation # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. @@ -16,8 +16,11 @@ """ This StaticWeb WSGI middleware will serve container data as a static web site with index file and error file resolution and optional file listings. This mode -is normally only active for anonymous requests. If you want to use it with -authenticated requests, set the ``X-Web-Mode: true`` header on the request. +is normally only active for anonymous requests. When using keystone for +authentication set ``delay_auth_decision = true`` in the authtoken middleware +configuration in your ``/etc/swift/proxy-server.conf`` file. If you want to +use it with authenticated requests, set the ``X-Web-Mode: true`` header on the +request. The ``staticweb`` filter should be added to the pipeline in your ``/etc/swift/proxy-server.conf`` file just after any auth middleware. Also, the @@ -28,26 +31,16 @@ ... [pipeline:main] - pipeline = catch_errors healthcheck cache ratelimit tempauth staticweb - proxy-logging proxy-server + pipeline = catch_errors healthcheck proxy-logging cache ratelimit tempauth + staticweb proxy-logging proxy-server ... [filter:staticweb] use = egg:swift#staticweb - # Seconds to cache container x-container-meta-web-* header values. 
-    # cache_timeout = 300
-    # You can override the default log routing for this filter here:
-    # set log_name = staticweb
-    # set log_facility = LOG_LOCAL0
-    # set log_level = INFO
-    # set access_log_name = staticweb
-    # set access_log_facility = LOG_LOCAL0
-    # set access_log_level = INFO
-    # set log_headers = False
 
 Any publicly readable containers (for example, ``X-Container-Read: .r:*``, see
-`acls`_ for more information on this) will be checked for
+:ref:`acls` for more information on this) will be checked for
 X-Container-Meta-Web-Index and X-Container-Meta-Web-Error header values::
 
     X-Container-Meta-Web-Index  <index.name>
@@ -64,9 +57,10 @@
 ``X-Container-Meta-Web-Error: error.html`` will serve .../404error.html for
 requests for paths not found.
 
-For psuedo paths that have no <index.name>, this middleware can serve HTML file
+For pseudo paths that have no <index.name>, this middleware can serve HTML file
 listings if you set the ``X-Container-Meta-Web-Listings: true`` metadata item
-on the container.
+on the container. Note that the listing must be authorized; you may want a
+container ACL like ``X-Container-Read: .r:*,.rlistings``.
 
 If listings are enabled, the listings can have a custom style sheet by setting
 the X-Container-Meta-Web-Listings-CSS header. For instance, setting
@@ -75,6 +69,29 @@
 listing page, you will see the well defined document structure that can be
 styled.
 
+Additionally, prefix-based :ref:`tempurl` parameters may be used to authorize
+requests instead of making the whole container publicly readable. This gives
+clients dynamic discoverability of the objects available within that prefix.
+
+.. note::
+
+    ``temp_url_prefix`` values should typically end with a slash (``/``) when
+    used with StaticWeb. StaticWeb's redirects will not carry over any TempURL
+    parameters, as they likely indicate that the user created an overly-broad
+    TempURL.
+
+By default, the listings will be rendered with a label of
+"Listing of /v1/account/container/path". This can be altered by
+setting a ``X-Container-Meta-Web-Listings-Label: